diff --git a/arabic/0.ckpt.h5 b/arabic/0.ckpt.h5 new file mode 100644 index 0000000..053e4a2 Binary files /dev/null and b/arabic/0.ckpt.h5 differ diff --git a/arabic/0.ckpt.json b/arabic/0.ckpt.json new file mode 100644 index 0000000..add72a5 --- /dev/null +++ b/arabic/0.ckpt.json @@ -0,0 +1,1031 @@ +{ + "model": { + "network": { + "layers": [ + { + "filters": 40, + "kernelSize": { + "x": 3, + "y": 3 + }, + "stride": { + "x": 1, + "y": 1 + } + }, + { + "type": "MAX_POOLING", + "kernelSize": { + "x": 2, + "y": 2 + }, + "stride": { + "x": 2, + "y": 2 + } + }, + { + "filters": 60, + "kernelSize": { + "x": 3, + "y": 3 + }, + "stride": { + "x": 1, + "y": 1 + } + }, + { + "type": "MAX_POOLING", + "kernelSize": { + "x": 2, + "y": 2 + }, + "stride": { + "x": 2, + "y": 2 + } + }, + { + "type": "LSTM", + "hiddenNodes": 200 + } + ], + "solver": "ADAM_SOLVER", + "dropout": 0.5, + "features": 48, + "classes": 150, + "backend": { + "cudnn": true, + "shuffleBufferSize": 1000 + }, + "ctcMergeRepeated": true, + "learningRate": 0.001, + "clippingNorm": 5.0 + }, + "lineHeight": 48, + "dataPreprocessor": { + "lineHeight": 48, + "pad": 16 + }, + "textPreprocessor": { + "type": "MULTI_NORMALIZER", + "children": [ + { + "type": "TEXT_NORMALIZER" + }, + { + "type": "TEXT_REGULARIZER", + "replacements": [ + { + "old": "\u00b5", + "new": "\u03bc" + }, + { + "old": "\u2013\u2014\u2014", + "new": "-" + }, + { + "old": "\u2013\u2014", + "new": "-" + }, + { + "old": "\"", + "new": "''" + }, + { + "old": "`", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u00b4", + "new": "'" + }, + { + "old": "\u2018", + "new": "'" + }, + { + "old": "\u2019", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201e", + "new": ",," + }, + { + "old": "\u2026", + "new": "..." + }, + { + "old": "\u2032", + "new": "'" + }, + { + "old": "\u2033", + "new": "''" + }, + { + "old": "\u2034", + "new": "'''" + }, + { + "old": "\u3003", + "new": "''" + }, + { + "old": "\u2160", + "new": "I" + }, + { + "old": "\u2161", + "new": "II" + }, + { + "old": "\u2162", + "new": "III" + }, + { + "old": "\u2163", + "new": "IV" + }, + { + "old": "\u2164", + "new": "V" + }, + { + "old": "\u2165", + "new": "VI" + }, + { + "old": "\u2166", + "new": "VII" + }, + { + "old": "\u2167", + "new": "VIII" + }, + { + "old": "\u2168", + "new": "IX" + }, + { + "old": "\u2169", + "new": "X" + }, + { + "old": "\u216a", + "new": "XI" + }, + { + "old": "\u216b", + "new": "XII" + }, + { + "old": "\u216c", + "new": "L" + }, + { + "old": "\u216d", + "new": "C" + }, + { + "old": "\u216e", + "new": "D" + }, + { + "old": "\u216f", + "new": "M" + }, + { + "old": "\u2170", + "new": "i" + }, + { + "old": "\u2171", + "new": "ii" + }, + { + "old": "\u2172", + "new": "iii" + }, + { + "old": "\u2173", + "new": "iv" + }, + { + "old": "\u2174", + "new": "v" + }, + { + "old": "\u2175", + "new": "vi" + }, + { + "old": "\u2176", + "new": "vii" + }, + { + "old": "\u2177", + "new": "viii" + }, + { + "old": "\u2178", + "new": "ix" + }, + { + "old": "\u2179", + "new": "x" + }, + { + "old": "\u217a", + "new": "xi" + }, + { + "old": "\u217b", + "new": "xii" + }, + { + "old": "\u217c", + "new": "l" + }, + { + "old": "\u217d", + "new": "c" + }, + { + "old": "\u217e", + "new": "d" + }, + { + "old": "\u217f", + "new": "m" + }, + { + "old": "\\s+(?u)", + "new": " ", + "regex": true + }, + { + "old": "\\n(?u)", + "regex": true + }, + { + "old": "^\\s+(?u)", + "regex": true + }, + { + "old": "\\s+$(?u)", + "regex": true + } + ] + }, + { + "type": "STRIP_NORMALIZER" + }, + { + "type": "BIDI_NORMALIZER", + "bidiDirection": "BIDI_RTL" + } + ] + }, + "textPostprocessor": { + "type": "MULTI_NORMALIZER", + "children": [ + { + "type": "TEXT_NORMALIZER" + }, + { + "type": "TEXT_REGULARIZER", + "replacements": [ + { + "old": "\u00b5", + "new": "\u03bc" + }, + { + "old": "\u2013\u2014\u2014", + "new": "-" + }, + { + "old": "\u2013\u2014", + "new": "-" + }, + { + "old": "\"", + "new": "''" + }, + { + "old": "`", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u00b4", + "new": "'" + }, + { + "old": "\u2018", + "new": "'" + }, + { + "old": "\u2019", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201e", + "new": ",," + }, + { + "old": "\u2026", + "new": "..." + }, + { + "old": "\u2032", + "new": "'" + }, + { + "old": "\u2033", + "new": "''" + }, + { + "old": "\u2034", + "new": "'''" + }, + { + "old": "\u3003", + "new": "''" + }, + { + "old": "\u2160", + "new": "I" + }, + { + "old": "\u2161", + "new": "II" + }, + { + "old": "\u2162", + "new": "III" + }, + { + "old": "\u2163", + "new": "IV" + }, + { + "old": "\u2164", + "new": "V" + }, + { + "old": "\u2165", + "new": "VI" + }, + { + "old": "\u2166", + "new": "VII" + }, + { + "old": "\u2167", + "new": "VIII" + }, + { + "old": "\u2168", + "new": "IX" + }, + { + "old": "\u2169", + "new": "X" + }, + { + "old": "\u216a", + "new": "XI" + }, + { + "old": "\u216b", + "new": "XII" + }, + { + "old": "\u216c", + "new": "L" + }, + { + "old": "\u216d", + "new": "C" + }, + { + "old": "\u216e", + "new": "D" + }, + { + "old": "\u216f", + "new": "M" + }, + { + "old": "\u2170", + "new": "i" + }, + { + "old": "\u2171", + "new": "ii" + }, + { + "old": "\u2172", + "new": "iii" + }, + { + "old": "\u2173", + "new": "iv" + }, + { + "old": "\u2174", + "new": "v" + }, + { + "old": "\u2175", + "new": "vi" + }, + { + "old": "\u2176", + "new": "vii" + }, + { + "old": "\u2177", + "new": "viii" + }, + { + "old": "\u2178", + "new": "ix" + }, + { + "old": "\u2179", + "new": "x" + }, + { + "old": "\u217a", + "new": "xi" + }, + { + "old": "\u217b", + "new": "xii" + }, + { + "old": "\u217c", + "new": "l" + }, + { + "old": "\u217d", + "new": "c" + }, + { + "old": "\u217e", + "new": "d" + }, + { + "old": "\u217f", + "new": "m" + }, + { + "old": "\\s+(?u)", + "new": " ", + "regex": true + }, + { + "old": "\\n(?u)", + "regex": true + }, + { + "old": "^\\s+(?u)", + "regex": true + }, + { + "old": "\\s+$(?u)", + "regex": true + } + ] + }, + { + "type": "STRIP_NORMALIZER" + }, + { + "type": "BIDI_NORMALIZER" + } + ] + }, + "codec": { + "charset": [ + "", + " ", + "!", + "'", + "(", + ")", + "*", + "+", + ",", + "-", + ".", + "/", + "0", + "1", + "2", + "3", + "4", + "5", + "6", + "7", + "8", + "9", + ":", + "<", + ">", + "A", + "B", + "C", + "D", + "E", + "H", + "I", + "K", + "L", + "M", + "N", + "O", + "P", + "R", + "S", + "T", + "U", + "V", + "X", + "[", + "]", + "_", + "a", + "b", + "c", + "d", + "e", + "f", + "g", + "h", + "i", + "j", + "l", + "m", + "n", + "o", + "p", + "q", + "r", + "s", + "t", + "u", + "v", + "x", + "y", + "{", + "|", + "}", + "~", + "\u028e", + "\u0391", + "\u0392", + "\u0398", + "\u0399", + "\u03a4", + "\u03b1", + "\u03b2", + "\u03b3", + "\u03b4", + "\u03b5", + "\u03b6", + "\u03b7", + "\u03b8", + "\u03b9", + "\u03bb", + "\u03bc", + "\u03bd", + "\u03be", + "\u03bf", + "\u03c0", + "\u03c1", + "\u03c3", + "\u03c4", + "\u03c5", + "\u03c7", + "\u03c8", + "\u03c9", + "\u060c", + "\u061b", + "\u061f", + "\u0621", + "\u0622", + "\u0623", + "\u0624", + "\u0625", + "\u0626", + "\u0627", + "\u0628", + "\u0629", + "\u062a", + "\u062b", + "\u062c", + "\u062d", + "\u062e", + "\u062f", + "\u0630", + "\u0631", + "\u0632", + "\u0633", + "\u0634", + "\u0635", + "\u0636", + "\u0637", + "\u0638", + "\u0639", + "\u063a", + "\u0640", + "\u0641", + "\u0642", + "\u0643", + "\u0644", + "\u0645", + "\u0646", + "\u0647", + "\u0648", + "\u0649", + "\u064a", + "\u064b", + "\u064c", + "\u064d", + "\u064e", + "\u064f", + "\u0650", + "\u0651", + "\u0652" + ] + } + }, + "processes": 1, + "maxIters": 10000000, + "skipInvalidGt": true, + "display": 500.0, + "statsSize": 100, + "batchSize": 1, + "checkpointFrequency": -1.0, + "iter": 145655, + "lossStats": [ + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity" + ], + "lerStats": [ + 0.10714286, + 0.0, + 0.0, + 0.07692308, + 0.0, + 0.027027028, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.020408163, + 0.014084507, + 0.42857143, + 0.0, + 0.013888889, + 0.015625, + 0.0, + 0.0, + 0.06666667, + 0.0, + 0.041666668, + 0.018181818, + 0.0, + 0.016949153, + 0.0, + 0.028985508, + 0.0, + 0.0, + 0.0, + 0.016666668, + 0.0, + 0.0121951215, + 0.0, + 0.0, + 0.02631579, + 0.0, + 0.03797468, + 0.0, + 0.0, + 0.028571429, + 0.0, + 0.0, + 0.22222222, + 0.0, + 0.0, + 0.028571429, + 0.0, + 0.012987013, + 0.016129032, + 0.0125, + 0.0, + 0.0, + 0.0, + 0.0, + 0.014084507, + 0.0125, + 0.0125, + 0.014084507, + 0.0, + 0.0, + 0.0, + 0.0, + 0.018867925, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.05, + 0.0, + 0.0, + 0.0, + 0.03125, + 0.0, + 0.0, + 0.013157895, + 0.01754386, + 0.0, + 0.0, + 0.0, + 0.0, + 0.057142857, + 0.11594203, + 0.0, + 0.0, + 0.04109589, + 0.0, + 0.0, + 0.0, + 0.0, + 0.14285715, + 0.0, + 0.018181818, + 0.0, + 0.015384615, + 0.06153846, + 0.0 + ], + "dtStats": [ + 0.019872427, + 0.019273043, + 0.019418478, + 0.015725851, + 0.019316673, + 0.019231796, + 0.017013073, + 0.015645742, + 0.012606144, + 0.024737358, + 0.016726732, + 0.0056824684, + 0.011679649, + 0.020799637, + 0.020661116, + 0.013441324, + 0.01749301, + 0.009653568, + 0.005949497, + 0.019438744, + 0.013981819, + 0.011568308, + 0.017554283, + 0.022220373, + 0.0210042, + 0.021757364, + 0.007322073, + 0.00734663, + 0.018117905, + 0.018877506, + 0.017254114, + 0.021746159, + 0.015915155, + 0.01168561, + 0.01970005, + 0.017407179, + 0.01659298, + 0.0056271553, + 0.017860413, + 0.017513275, + 0.020680904, + 0.018809795, + 0.027515411, + 0.005841732, + 0.01919794, + 0.016146183, + 0.017425776, + 0.02034545, + 0.017019987, + 0.020632505, + 0.019468784, + 0.016881704, + 0.019638538, + 0.01737237, + 0.019996166, + 0.019107819, + 0.018211365, + 0.018561363, + 0.009345055, + 0.017338037, + 0.020765066, + 0.023724556, + 0.018580914, + 0.0063130856, + 0.018755198, + 0.018095016, + 0.018758774, + 0.011855841, + 0.013149023, + 0.021172285, + 0.018042088, + 0.0050797462, + 0.0061802864, + 0.009308815, + 0.016502142, + 0.016630888, + 0.016345501, + 0.034225225, + 0.020647764, + 0.014774084, + 0.018321276, + 0.018166542, + 0.016455889, + 0.016796112, + 0.023615599, + 0.020033836, + 0.019813776, + 0.019940376, + 0.00578475, + 0.008072376, + 0.012652397, + 0.04093194, + 0.017230988, + 0.023439884, + 0.020038843, + 0.019645214, + 0.013179302, + 0.0049943924, + 0.01782918, + 0.018062115 + ], + "totalTime": 2836.8252, + "earlyStoppingFrequency": -1.0, + "earlyStoppingNbest": 5, + "earlyStoppingBestModelPrefix": "best_arabic_new_1_", + "earlyStoppingBestAccuracy": 0.98018354, + "earlyStoppingBestCurNbest": 1, + "earlyStoppingBestAtIter": 145656, + "outputModelPrefix": "arabic_new_1_", + "dataAugRetrainOnOriginal": true, + "version": 2 +} \ No newline at end of file diff --git a/arabic/1.ckpt.h5 b/arabic/1.ckpt.h5 new file mode 100644 index 0000000..0993cf4 Binary files /dev/null and b/arabic/1.ckpt.h5 differ diff --git a/arabic/1.ckpt.json b/arabic/1.ckpt.json new file mode 100644 index 0000000..79390d6 --- /dev/null +++ b/arabic/1.ckpt.json @@ -0,0 +1,1031 @@ +{ + "model": { + "network": { + "layers": [ + { + "filters": 40, + "kernelSize": { + "x": 3, + "y": 3 + }, + "stride": { + "x": 1, + "y": 1 + } + }, + { + "type": "MAX_POOLING", + "kernelSize": { + "x": 2, + "y": 2 + }, + "stride": { + "x": 2, + "y": 2 + } + }, + { + "filters": 60, + "kernelSize": { + "x": 3, + "y": 3 + }, + "stride": { + "x": 1, + "y": 1 + } + }, + { + "type": "MAX_POOLING", + "kernelSize": { + "x": 2, + "y": 2 + }, + "stride": { + "x": 2, + "y": 2 + } + }, + { + "type": "LSTM", + "hiddenNodes": 200 + } + ], + "solver": "ADAM_SOLVER", + "dropout": 0.5, + "features": 48, + "classes": 150, + "backend": { + "cudnn": true, + "shuffleBufferSize": 1000 + }, + "ctcMergeRepeated": true, + "learningRate": 0.001, + "clippingNorm": 5.0 + }, + "lineHeight": 48, + "dataPreprocessor": { + "lineHeight": 48, + "pad": 16 + }, + "textPreprocessor": { + "type": "MULTI_NORMALIZER", + "children": [ + { + "type": "TEXT_NORMALIZER" + }, + { + "type": "TEXT_REGULARIZER", + "replacements": [ + { + "old": "\u00b5", + "new": "\u03bc" + }, + { + "old": "\u2013\u2014\u2014", + "new": "-" + }, + { + "old": "\u2013\u2014", + "new": "-" + }, + { + "old": "\"", + "new": "''" + }, + { + "old": "`", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u00b4", + "new": "'" + }, + { + "old": "\u2018", + "new": "'" + }, + { + "old": "\u2019", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201e", + "new": ",," + }, + { + "old": "\u2026", + "new": "..." + }, + { + "old": "\u2032", + "new": "'" + }, + { + "old": "\u2033", + "new": "''" + }, + { + "old": "\u2034", + "new": "'''" + }, + { + "old": "\u3003", + "new": "''" + }, + { + "old": "\u2160", + "new": "I" + }, + { + "old": "\u2161", + "new": "II" + }, + { + "old": "\u2162", + "new": "III" + }, + { + "old": "\u2163", + "new": "IV" + }, + { + "old": "\u2164", + "new": "V" + }, + { + "old": "\u2165", + "new": "VI" + }, + { + "old": "\u2166", + "new": "VII" + }, + { + "old": "\u2167", + "new": "VIII" + }, + { + "old": "\u2168", + "new": "IX" + }, + { + "old": "\u2169", + "new": "X" + }, + { + "old": "\u216a", + "new": "XI" + }, + { + "old": "\u216b", + "new": "XII" + }, + { + "old": "\u216c", + "new": "L" + }, + { + "old": "\u216d", + "new": "C" + }, + { + "old": "\u216e", + "new": "D" + }, + { + "old": "\u216f", + "new": "M" + }, + { + "old": "\u2170", + "new": "i" + }, + { + "old": "\u2171", + "new": "ii" + }, + { + "old": "\u2172", + "new": "iii" + }, + { + "old": "\u2173", + "new": "iv" + }, + { + "old": "\u2174", + "new": "v" + }, + { + "old": "\u2175", + "new": "vi" + }, + { + "old": "\u2176", + "new": "vii" + }, + { + "old": "\u2177", + "new": "viii" + }, + { + "old": "\u2178", + "new": "ix" + }, + { + "old": "\u2179", + "new": "x" + }, + { + "old": "\u217a", + "new": "xi" + }, + { + "old": "\u217b", + "new": "xii" + }, + { + "old": "\u217c", + "new": "l" + }, + { + "old": "\u217d", + "new": "c" + }, + { + "old": "\u217e", + "new": "d" + }, + { + "old": "\u217f", + "new": "m" + }, + { + "old": "\\s+(?u)", + "new": " ", + "regex": true + }, + { + "old": "\\n(?u)", + "regex": true + }, + { + "old": "^\\s+(?u)", + "regex": true + }, + { + "old": "\\s+$(?u)", + "regex": true + } + ] + }, + { + "type": "STRIP_NORMALIZER" + }, + { + "type": "BIDI_NORMALIZER", + "bidiDirection": "BIDI_RTL" + } + ] + }, + "textPostprocessor": { + "type": "MULTI_NORMALIZER", + "children": [ + { + "type": "TEXT_NORMALIZER" + }, + { + "type": "TEXT_REGULARIZER", + "replacements": [ + { + "old": "\u00b5", + "new": "\u03bc" + }, + { + "old": "\u2013\u2014\u2014", + "new": "-" + }, + { + "old": "\u2013\u2014", + "new": "-" + }, + { + "old": "\"", + "new": "''" + }, + { + "old": "`", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u00b4", + "new": "'" + }, + { + "old": "\u2018", + "new": "'" + }, + { + "old": "\u2019", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201e", + "new": ",," + }, + { + "old": "\u2026", + "new": "..." + }, + { + "old": "\u2032", + "new": "'" + }, + { + "old": "\u2033", + "new": "''" + }, + { + "old": "\u2034", + "new": "'''" + }, + { + "old": "\u3003", + "new": "''" + }, + { + "old": "\u2160", + "new": "I" + }, + { + "old": "\u2161", + "new": "II" + }, + { + "old": "\u2162", + "new": "III" + }, + { + "old": "\u2163", + "new": "IV" + }, + { + "old": "\u2164", + "new": "V" + }, + { + "old": "\u2165", + "new": "VI" + }, + { + "old": "\u2166", + "new": "VII" + }, + { + "old": "\u2167", + "new": "VIII" + }, + { + "old": "\u2168", + "new": "IX" + }, + { + "old": "\u2169", + "new": "X" + }, + { + "old": "\u216a", + "new": "XI" + }, + { + "old": "\u216b", + "new": "XII" + }, + { + "old": "\u216c", + "new": "L" + }, + { + "old": "\u216d", + "new": "C" + }, + { + "old": "\u216e", + "new": "D" + }, + { + "old": "\u216f", + "new": "M" + }, + { + "old": "\u2170", + "new": "i" + }, + { + "old": "\u2171", + "new": "ii" + }, + { + "old": "\u2172", + "new": "iii" + }, + { + "old": "\u2173", + "new": "iv" + }, + { + "old": "\u2174", + "new": "v" + }, + { + "old": "\u2175", + "new": "vi" + }, + { + "old": "\u2176", + "new": "vii" + }, + { + "old": "\u2177", + "new": "viii" + }, + { + "old": "\u2178", + "new": "ix" + }, + { + "old": "\u2179", + "new": "x" + }, + { + "old": "\u217a", + "new": "xi" + }, + { + "old": "\u217b", + "new": "xii" + }, + { + "old": "\u217c", + "new": "l" + }, + { + "old": "\u217d", + "new": "c" + }, + { + "old": "\u217e", + "new": "d" + }, + { + "old": "\u217f", + "new": "m" + }, + { + "old": "\\s+(?u)", + "new": " ", + "regex": true + }, + { + "old": "\\n(?u)", + "regex": true + }, + { + "old": "^\\s+(?u)", + "regex": true + }, + { + "old": "\\s+$(?u)", + "regex": true + } + ] + }, + { + "type": "STRIP_NORMALIZER" + }, + { + "type": "BIDI_NORMALIZER" + } + ] + }, + "codec": { + "charset": [ + "", + " ", + "!", + "'", + "(", + ")", + "*", + "+", + ",", + "-", + ".", + "/", + "0", + "1", + "2", + "3", + "4", + "5", + "6", + "7", + "8", + "9", + ":", + "<", + ">", + "A", + "B", + "C", + "D", + "E", + "H", + "I", + "K", + "L", + "M", + "N", + "O", + "P", + "R", + "S", + "T", + "U", + "V", + "X", + "[", + "]", + "_", + "a", + "b", + "c", + "d", + "e", + "f", + "g", + "h", + "i", + "j", + "l", + "m", + "n", + "o", + "p", + "q", + "r", + "s", + "t", + "u", + "v", + "x", + "y", + "{", + "|", + "}", + "~", + "\u028e", + "\u0391", + "\u0392", + "\u0398", + "\u0399", + "\u03a4", + "\u03b1", + "\u03b2", + "\u03b3", + "\u03b4", + "\u03b5", + "\u03b6", + "\u03b7", + "\u03b8", + "\u03b9", + "\u03bb", + "\u03bc", + "\u03bd", + "\u03be", + "\u03bf", + "\u03c0", + "\u03c1", + "\u03c3", + "\u03c4", + "\u03c5", + "\u03c7", + "\u03c8", + "\u03c9", + "\u060c", + "\u061b", + "\u061f", + "\u0621", + "\u0622", + "\u0623", + "\u0624", + "\u0625", + "\u0626", + "\u0627", + "\u0628", + "\u0629", + "\u062a", + "\u062b", + "\u062c", + "\u062d", + "\u062e", + "\u062f", + "\u0630", + "\u0631", + "\u0632", + "\u0633", + "\u0634", + "\u0635", + "\u0636", + "\u0637", + "\u0638", + "\u0639", + "\u063a", + "\u0640", + "\u0641", + "\u0642", + "\u0643", + "\u0644", + "\u0645", + "\u0646", + "\u0647", + "\u0648", + "\u0649", + "\u064a", + "\u064b", + "\u064c", + "\u064d", + "\u064e", + "\u064f", + "\u0650", + "\u0651", + "\u0652" + ] + } + }, + "processes": 1, + "maxIters": 10000000, + "skipInvalidGt": true, + "display": 500.0, + "statsSize": 100, + "batchSize": 1, + "checkpointFrequency": -1.0, + "iter": 364139, + "lossStats": [ + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity" + ], + "lerStats": [ + 0.0125, + 0.0, + 0.014084507, + 0.013888889, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.14285715, + 0.0, + 0.03125, + 0.039473683, + 0.050847456, + 0.014285714, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.05882353, + 0.016393442, + 0.013888889, + 0.0, + 0.0, + 0.013157895, + 0.0, + 0.018518519, + 0.0, + 0.0, + 0.0, + 0.14285715, + 0.02739726, + 0.0, + 0.024691358, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.016393442, + 0.0, + 0.0, + 0.07575758, + 0.0, + 0.018181818, + 0.0125, + 0.0, + 0.014084507, + 0.0, + 0.019607844, + 0.014492754, + 0.0, + 0.06666667, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.014285714, + 0.0, + 0.016129032, + 0.0, + 0.03448276, + 0.040816326, + 0.0, + 0.035714287, + 0.0, + 0.014492754, + 0.0, + 0.014285714, + 0.0, + 0.030303031, + 0.0, + 0.0, + 0.0, + 0.0, + 0.028985508, + 0.0, + 0.01369863, + 0.0, + 0.0, + 0.0, + 0.0, + 0.013157895, + 0.0, + 0.37313432, + 0.01724138, + 0.0, + 0.0, + 0.0, + 0.0, + 0.024691358, + 0.0, + 0.0 + ], + "dtStats": [ + 0.020548582, + 0.024151087, + 0.018998384, + 0.024532318, + 0.0121665, + 0.022799969, + 0.018761635, + 0.012409687, + 0.0086426735, + 0.018665314, + 0.0074071884, + 0.022366524, + 0.006526947, + 0.019050121, + 0.01851964, + 0.030644655, + 0.018973827, + 0.018301964, + 0.008334875, + 0.016488552, + 0.017866611, + 0.018051386, + 0.018445492, + 0.005964279, + 0.016885042, + 0.020151138, + 0.009068966, + 0.0073046684, + 0.012806416, + 0.018693686, + 0.011739016, + 0.020257235, + 0.013377428, + 0.0067048073, + 0.020016193, + 0.015402317, + 0.016568422, + 0.0055520535, + 0.019150019, + 0.013192177, + 0.008799076, + 0.017703056, + 0.018449306, + 0.013607264, + 0.012646675, + 0.019927263, + 0.016787052, + 0.019129276, + 0.018533707, + 0.016440868, + 0.018056631, + 0.016275883, + 0.03199935, + 0.018316984, + 0.010939121, + 0.006030798, + 0.02448368, + 0.018026352, + 0.006620407, + 0.03868389, + 0.0076663494, + 0.008718967, + 0.012265682, + 0.019070625, + 0.015349627, + 0.01916933, + 0.015798569, + 0.018906832, + 0.01205039, + 0.01603198, + 0.0216434, + 0.010089874, + 0.008769035, + 0.0069196224, + 0.017931938, + 0.015124083, + 0.010510445, + 0.0073559284, + 0.01695323, + 0.01746273, + 0.024890184, + 0.020240784, + 0.017248392, + 0.01954937, + 0.017904758, + 0.017355442, + 0.017011166, + 0.030165195, + 0.0073611736, + 0.016207933, + 0.020910025, + 0.011872292, + 0.01940775, + 0.025356293, + 0.012863636, + 0.008835077, + 0.01438427, + 0.014754772, + 0.020546198, + 0.017948389 + ], + "totalTime": 7054.3584, + "earlyStoppingFrequency": -1.0, + "earlyStoppingNbest": 5, + "earlyStoppingBestModelPrefix": "best_arabic_new_2_", + "earlyStoppingBestAccuracy": 0.97573453, + "earlyStoppingBestCurNbest": 1, + "earlyStoppingBestAtIter": 364140, + "outputModelPrefix": "arabic_new_2_", + "dataAugRetrainOnOriginal": true, + "version": 2 +} \ No newline at end of file diff --git a/arabic/2.ckpt.h5 b/arabic/2.ckpt.h5 new file mode 100644 index 0000000..2fa2fc8 Binary files /dev/null and b/arabic/2.ckpt.h5 differ diff --git a/arabic/2.ckpt.json b/arabic/2.ckpt.json new file mode 100644 index 0000000..ba6de96 --- /dev/null +++ b/arabic/2.ckpt.json @@ -0,0 +1,1031 @@ +{ + "model": { + "network": { + "layers": [ + { + "filters": 40, + "kernelSize": { + "x": 3, + "y": 3 + }, + "stride": { + "x": 1, + "y": 1 + } + }, + { + "type": "MAX_POOLING", + "kernelSize": { + "x": 2, + "y": 2 + }, + "stride": { + "x": 2, + "y": 2 + } + }, + { + "filters": 60, + "kernelSize": { + "x": 3, + "y": 3 + }, + "stride": { + "x": 1, + "y": 1 + } + }, + { + "type": "MAX_POOLING", + "kernelSize": { + "x": 2, + "y": 2 + }, + "stride": { + "x": 2, + "y": 2 + } + }, + { + "type": "LSTM", + "hiddenNodes": 200 + } + ], + "solver": "ADAM_SOLVER", + "dropout": 0.5, + "features": 48, + "classes": 150, + "backend": { + "cudnn": true, + "shuffleBufferSize": 1000 + }, + "ctcMergeRepeated": true, + "learningRate": 0.001, + "clippingNorm": 5.0 + }, + "lineHeight": 48, + "dataPreprocessor": { + "lineHeight": 48, + "pad": 16 + }, + "textPreprocessor": { + "type": "MULTI_NORMALIZER", + "children": [ + { + "type": "TEXT_NORMALIZER" + }, + { + "type": "TEXT_REGULARIZER", + "replacements": [ + { + "old": "\u00b5", + "new": "\u03bc" + }, + { + "old": "\u2013\u2014\u2014", + "new": "-" + }, + { + "old": "\u2013\u2014", + "new": "-" + }, + { + "old": "\"", + "new": "''" + }, + { + "old": "`", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u00b4", + "new": "'" + }, + { + "old": "\u2018", + "new": "'" + }, + { + "old": "\u2019", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201e", + "new": ",," + }, + { + "old": "\u2026", + "new": "..." + }, + { + "old": "\u2032", + "new": "'" + }, + { + "old": "\u2033", + "new": "''" + }, + { + "old": "\u2034", + "new": "'''" + }, + { + "old": "\u3003", + "new": "''" + }, + { + "old": "\u2160", + "new": "I" + }, + { + "old": "\u2161", + "new": "II" + }, + { + "old": "\u2162", + "new": "III" + }, + { + "old": "\u2163", + "new": "IV" + }, + { + "old": "\u2164", + "new": "V" + }, + { + "old": "\u2165", + "new": "VI" + }, + { + "old": "\u2166", + "new": "VII" + }, + { + "old": "\u2167", + "new": "VIII" + }, + { + "old": "\u2168", + "new": "IX" + }, + { + "old": "\u2169", + "new": "X" + }, + { + "old": "\u216a", + "new": "XI" + }, + { + "old": "\u216b", + "new": "XII" + }, + { + "old": "\u216c", + "new": "L" + }, + { + "old": "\u216d", + "new": "C" + }, + { + "old": "\u216e", + "new": "D" + }, + { + "old": "\u216f", + "new": "M" + }, + { + "old": "\u2170", + "new": "i" + }, + { + "old": "\u2171", + "new": "ii" + }, + { + "old": "\u2172", + "new": "iii" + }, + { + "old": "\u2173", + "new": "iv" + }, + { + "old": "\u2174", + "new": "v" + }, + { + "old": "\u2175", + "new": "vi" + }, + { + "old": "\u2176", + "new": "vii" + }, + { + "old": "\u2177", + "new": "viii" + }, + { + "old": "\u2178", + "new": "ix" + }, + { + "old": "\u2179", + "new": "x" + }, + { + "old": "\u217a", + "new": "xi" + }, + { + "old": "\u217b", + "new": "xii" + }, + { + "old": "\u217c", + "new": "l" + }, + { + "old": "\u217d", + "new": "c" + }, + { + "old": "\u217e", + "new": "d" + }, + { + "old": "\u217f", + "new": "m" + }, + { + "old": "\\s+(?u)", + "new": " ", + "regex": true + }, + { + "old": "\\n(?u)", + "regex": true + }, + { + "old": "^\\s+(?u)", + "regex": true + }, + { + "old": "\\s+$(?u)", + "regex": true + } + ] + }, + { + "type": "STRIP_NORMALIZER" + }, + { + "type": "BIDI_NORMALIZER", + "bidiDirection": "BIDI_RTL" + } + ] + }, + "textPostprocessor": { + "type": "MULTI_NORMALIZER", + "children": [ + { + "type": "TEXT_NORMALIZER" + }, + { + "type": "TEXT_REGULARIZER", + "replacements": [ + { + "old": "\u00b5", + "new": "\u03bc" + }, + { + "old": "\u2013\u2014\u2014", + "new": "-" + }, + { + "old": "\u2013\u2014", + "new": "-" + }, + { + "old": "\"", + "new": "''" + }, + { + "old": "`", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u00b4", + "new": "'" + }, + { + "old": "\u2018", + "new": "'" + }, + { + "old": "\u2019", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201e", + "new": ",," + }, + { + "old": "\u2026", + "new": "..." + }, + { + "old": "\u2032", + "new": "'" + }, + { + "old": "\u2033", + "new": "''" + }, + { + "old": "\u2034", + "new": "'''" + }, + { + "old": "\u3003", + "new": "''" + }, + { + "old": "\u2160", + "new": "I" + }, + { + "old": "\u2161", + "new": "II" + }, + { + "old": "\u2162", + "new": "III" + }, + { + "old": "\u2163", + "new": "IV" + }, + { + "old": "\u2164", + "new": "V" + }, + { + "old": "\u2165", + "new": "VI" + }, + { + "old": "\u2166", + "new": "VII" + }, + { + "old": "\u2167", + "new": "VIII" + }, + { + "old": "\u2168", + "new": "IX" + }, + { + "old": "\u2169", + "new": "X" + }, + { + "old": "\u216a", + "new": "XI" + }, + { + "old": "\u216b", + "new": "XII" + }, + { + "old": "\u216c", + "new": "L" + }, + { + "old": "\u216d", + "new": "C" + }, + { + "old": "\u216e", + "new": "D" + }, + { + "old": "\u216f", + "new": "M" + }, + { + "old": "\u2170", + "new": "i" + }, + { + "old": "\u2171", + "new": "ii" + }, + { + "old": "\u2172", + "new": "iii" + }, + { + "old": "\u2173", + "new": "iv" + }, + { + "old": "\u2174", + "new": "v" + }, + { + "old": "\u2175", + "new": "vi" + }, + { + "old": "\u2176", + "new": "vii" + }, + { + "old": "\u2177", + "new": "viii" + }, + { + "old": "\u2178", + "new": "ix" + }, + { + "old": "\u2179", + "new": "x" + }, + { + "old": "\u217a", + "new": "xi" + }, + { + "old": "\u217b", + "new": "xii" + }, + { + "old": "\u217c", + "new": "l" + }, + { + "old": "\u217d", + "new": "c" + }, + { + "old": "\u217e", + "new": "d" + }, + { + "old": "\u217f", + "new": "m" + }, + { + "old": "\\s+(?u)", + "new": " ", + "regex": true + }, + { + "old": "\\n(?u)", + "regex": true + }, + { + "old": "^\\s+(?u)", + "regex": true + }, + { + "old": "\\s+$(?u)", + "regex": true + } + ] + }, + { + "type": "STRIP_NORMALIZER" + }, + { + "type": "BIDI_NORMALIZER" + } + ] + }, + "codec": { + "charset": [ + "", + " ", + "!", + "'", + "(", + ")", + "*", + "+", + ",", + "-", + ".", + "/", + "0", + "1", + "2", + "3", + "4", + "5", + "6", + "7", + "8", + "9", + ":", + "<", + ">", + "A", + "B", + "C", + "D", + "E", + "H", + "I", + "K", + "L", + "M", + "N", + "O", + "P", + "R", + "S", + "T", + "U", + "V", + "X", + "[", + "]", + "_", + "a", + "b", + "c", + "d", + "e", + "f", + "g", + "h", + "i", + "j", + "l", + "m", + "n", + "o", + "p", + "q", + "r", + "s", + "t", + "u", + "v", + "x", + "y", + "{", + "|", + "}", + "~", + "\u028e", + "\u0391", + "\u0392", + "\u0398", + "\u0399", + "\u03a4", + "\u03b1", + "\u03b2", + "\u03b3", + "\u03b4", + "\u03b5", + "\u03b6", + "\u03b7", + "\u03b8", + "\u03b9", + "\u03bb", + "\u03bc", + "\u03bd", + "\u03be", + "\u03bf", + "\u03c0", + "\u03c1", + "\u03c3", + "\u03c4", + "\u03c5", + "\u03c7", + "\u03c8", + "\u03c9", + "\u060c", + "\u061b", + "\u061f", + "\u0621", + "\u0622", + "\u0623", + "\u0624", + "\u0625", + "\u0626", + "\u0627", + "\u0628", + "\u0629", + "\u062a", + "\u062b", + "\u062c", + "\u062d", + "\u062e", + "\u062f", + "\u0630", + "\u0631", + "\u0632", + "\u0633", + "\u0634", + "\u0635", + "\u0636", + "\u0637", + "\u0638", + "\u0639", + "\u063a", + "\u0640", + "\u0641", + "\u0642", + "\u0643", + "\u0644", + "\u0645", + "\u0646", + "\u0647", + "\u0648", + "\u0649", + "\u064a", + "\u064b", + "\u064c", + "\u064d", + "\u064e", + "\u064f", + "\u0650", + "\u0651", + "\u0652" + ] + } + }, + "processes": 1, + "maxIters": 10000000, + "skipInvalidGt": true, + "display": 500.0, + "statsSize": 100, + "batchSize": 1, + "checkpointFrequency": -1.0, + "iter": 145655, + "lossStats": [ + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity" + ], + "lerStats": [ + 0.01369863, + 0.016949153, + 0.0, + 0.0, + 0.0, + 0.013157895, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0125, + 0.0, + 0.0, + 0.0, + 0.0125, + 0.0, + 0.0, + 0.027027028, + 0.073529415, + 0.0, + 0.014492754, + 0.0, + 0.03846154, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.033333335, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.6666667, + 0.0, + 0.0, + 0.013888889, + 0.0, + 0.0, + 0.014285714, + 0.0, + 0.0, + 0.025, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.023255814, + 0.0, + 0.6666667, + 0.0, + 0.0, + 0.0, + 0.0, + 0.014705882, + 0.0, + 0.02739726, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0952381, + 0.0, + 0.0, + 0.04347826, + 0.0, + 0.0, + 0.0, + 0.0, + 0.04477612, + 0.0, + 0.0, + 0.014925373, + 0.012987013, + 0.015625, + 0.0 + ], + "dtStats": [ + 0.01930213, + 0.019165993, + 0.015349388, + 0.017691612, + 0.0152812, + 0.020575523, + 0.01828909, + 0.017749071, + 0.016619205, + 0.021256685, + 0.012275457, + 0.013953924, + 0.01759696, + 0.016159773, + 0.020910263, + 0.018269539, + 0.008505106, + 0.013687611, + 0.020164967, + 0.015257835, + 0.016673803, + 0.017296314, + 0.008207798, + 0.019286394, + 0.017681122, + 0.016113281, + 0.02005601, + 0.019693613, + 0.01119256, + 0.020454168, + 0.032533407, + 0.006988764, + 0.0065248013, + 0.01858759, + 0.012365103, + 0.010347843, + 0.014660835, + 0.02104187, + 0.021223307, + 0.013328314, + 0.020009756, + 0.017448187, + 0.017878532, + 0.018936157, + 0.0064225197, + 0.019128084, + 0.009780645, + 0.017853022, + 0.01812005, + 0.018401384, + 0.017805338, + 0.018785477, + 0.018678665, + 0.021162033, + 0.01905489, + 0.0052731037, + 0.020580053, + 0.01871872, + 0.018387318, + 0.011866331, + 0.01997137, + 0.019187927, + 0.019408703, + 0.01902175, + 0.018125772, + 0.01790595, + 0.018936634, + 0.010565996, + 0.018078804, + 0.0071713924, + 0.016238451, + 0.02021432, + 0.020869255, + 0.020165205, + 0.03023386, + 0.012555361, + 0.017957449, + 0.0210073, + 0.02121687, + 0.017501116, + 0.017839432, + 0.008218765, + 0.018244982, + 0.01949668, + 0.019680262, + 0.015305996, + 0.020093918, + 0.019319296, + 0.018457413, + 0.01641655, + 0.014648199, + 0.019173384, + 0.014424086, + 0.018701315, + 0.02777481, + 0.013977051, + 0.01742673, + 0.018341303, + 0.013790131, + 0.025485516 + ], + "totalTime": 2854.496, + "earlyStoppingFrequency": -1.0, + "earlyStoppingNbest": 5, + "earlyStoppingBestModelPrefix": "best_arabic_new_3_", + "earlyStoppingBestAccuracy": 0.97714645, + "earlyStoppingBestCurNbest": 1, + "earlyStoppingBestAtIter": 145656, + "outputModelPrefix": "arabic_new_3_", + "dataAugRetrainOnOriginal": true, + "version": 2 +} \ No newline at end of file diff --git a/arabic/3.ckpt.h5 b/arabic/3.ckpt.h5 new file mode 100644 index 0000000..54b1ff8 Binary files /dev/null and b/arabic/3.ckpt.h5 differ diff --git a/arabic/3.ckpt.json b/arabic/3.ckpt.json new file mode 100644 index 0000000..1363253 --- /dev/null +++ b/arabic/3.ckpt.json @@ -0,0 +1,1031 @@ +{ + "model": { + "network": { + "layers": [ + { + "filters": 40, + "kernelSize": { + "x": 3, + "y": 3 + }, + "stride": { + "x": 1, + "y": 1 + } + }, + { + "type": "MAX_POOLING", + "kernelSize": { + "x": 2, + "y": 2 + }, + "stride": { + "x": 2, + "y": 2 + } + }, + { + "filters": 60, + "kernelSize": { + "x": 3, + "y": 3 + }, + "stride": { + "x": 1, + "y": 1 + } + }, + { + "type": "MAX_POOLING", + "kernelSize": { + "x": 2, + "y": 2 + }, + "stride": { + "x": 2, + "y": 2 + } + }, + { + "type": "LSTM", + "hiddenNodes": 200 + } + ], + "solver": "ADAM_SOLVER", + "dropout": 0.5, + "features": 48, + "classes": 150, + "backend": { + "cudnn": true, + "shuffleBufferSize": 1000 + }, + "ctcMergeRepeated": true, + "learningRate": 0.001, + "clippingNorm": 5.0 + }, + "lineHeight": 48, + "dataPreprocessor": { + "lineHeight": 48, + "pad": 16 + }, + "textPreprocessor": { + "type": "MULTI_NORMALIZER", + "children": [ + { + "type": "TEXT_NORMALIZER" + }, + { + "type": "TEXT_REGULARIZER", + "replacements": [ + { + "old": "\u00b5", + "new": "\u03bc" + }, + { + "old": "\u2013\u2014\u2014", + "new": "-" + }, + { + "old": "\u2013\u2014", + "new": "-" + }, + { + "old": "\"", + "new": "''" + }, + { + "old": "`", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u00b4", + "new": "'" + }, + { + "old": "\u2018", + "new": "'" + }, + { + "old": "\u2019", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201e", + "new": ",," + }, + { + "old": "\u2026", + "new": "..." + }, + { + "old": "\u2032", + "new": "'" + }, + { + "old": "\u2033", + "new": "''" + }, + { + "old": "\u2034", + "new": "'''" + }, + { + "old": "\u3003", + "new": "''" + }, + { + "old": "\u2160", + "new": "I" + }, + { + "old": "\u2161", + "new": "II" + }, + { + "old": "\u2162", + "new": "III" + }, + { + "old": "\u2163", + "new": "IV" + }, + { + "old": "\u2164", + "new": "V" + }, + { + "old": "\u2165", + "new": "VI" + }, + { + "old": "\u2166", + "new": "VII" + }, + { + "old": "\u2167", + "new": "VIII" + }, + { + "old": "\u2168", + "new": "IX" + }, + { + "old": "\u2169", + "new": "X" + }, + { + "old": "\u216a", + "new": "XI" + }, + { + "old": "\u216b", + "new": "XII" + }, + { + "old": "\u216c", + "new": "L" + }, + { + "old": "\u216d", + "new": "C" + }, + { + "old": "\u216e", + "new": "D" + }, + { + "old": "\u216f", + "new": "M" + }, + { + "old": "\u2170", + "new": "i" + }, + { + "old": "\u2171", + "new": "ii" + }, + { + "old": "\u2172", + "new": "iii" + }, + { + "old": "\u2173", + "new": "iv" + }, + { + "old": "\u2174", + "new": "v" + }, + { + "old": "\u2175", + "new": "vi" + }, + { + "old": "\u2176", + "new": "vii" + }, + { + "old": "\u2177", + "new": "viii" + }, + { + "old": "\u2178", + "new": "ix" + }, + { + "old": "\u2179", + "new": "x" + }, + { + "old": "\u217a", + "new": "xi" + }, + { + "old": "\u217b", + "new": "xii" + }, + { + "old": "\u217c", + "new": "l" + }, + { + "old": "\u217d", + "new": "c" + }, + { + "old": "\u217e", + "new": "d" + }, + { + "old": "\u217f", + "new": "m" + }, + { + "old": "\\s+(?u)", + "new": " ", + "regex": true + }, + { + "old": "\\n(?u)", + "regex": true + }, + { + "old": "^\\s+(?u)", + "regex": true + }, + { + "old": "\\s+$(?u)", + "regex": true + } + ] + }, + { + "type": "STRIP_NORMALIZER" + }, + { + "type": "BIDI_NORMALIZER", + "bidiDirection": "BIDI_RTL" + } + ] + }, + "textPostprocessor": { + "type": "MULTI_NORMALIZER", + "children": [ + { + "type": "TEXT_NORMALIZER" + }, + { + "type": "TEXT_REGULARIZER", + "replacements": [ + { + "old": "\u00b5", + "new": "\u03bc" + }, + { + "old": "\u2013\u2014\u2014", + "new": "-" + }, + { + "old": "\u2013\u2014", + "new": "-" + }, + { + "old": "\"", + "new": "''" + }, + { + "old": "`", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u00b4", + "new": "'" + }, + { + "old": "\u2018", + "new": "'" + }, + { + "old": "\u2019", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201e", + "new": ",," + }, + { + "old": "\u2026", + "new": "..." + }, + { + "old": "\u2032", + "new": "'" + }, + { + "old": "\u2033", + "new": "''" + }, + { + "old": "\u2034", + "new": "'''" + }, + { + "old": "\u3003", + "new": "''" + }, + { + "old": "\u2160", + "new": "I" + }, + { + "old": "\u2161", + "new": "II" + }, + { + "old": "\u2162", + "new": "III" + }, + { + "old": "\u2163", + "new": "IV" + }, + { + "old": "\u2164", + "new": "V" + }, + { + "old": "\u2165", + "new": "VI" + }, + { + "old": "\u2166", + "new": "VII" + }, + { + "old": "\u2167", + "new": "VIII" + }, + { + "old": "\u2168", + "new": "IX" + }, + { + "old": "\u2169", + "new": "X" + }, + { + "old": "\u216a", + "new": "XI" + }, + { + "old": "\u216b", + "new": "XII" + }, + { + "old": "\u216c", + "new": "L" + }, + { + "old": "\u216d", + "new": "C" + }, + { + "old": "\u216e", + "new": "D" + }, + { + "old": "\u216f", + "new": "M" + }, + { + "old": "\u2170", + "new": "i" + }, + { + "old": "\u2171", + "new": "ii" + }, + { + "old": "\u2172", + "new": "iii" + }, + { + "old": "\u2173", + "new": "iv" + }, + { + "old": "\u2174", + "new": "v" + }, + { + "old": "\u2175", + "new": "vi" + }, + { + "old": "\u2176", + "new": "vii" + }, + { + "old": "\u2177", + "new": "viii" + }, + { + "old": "\u2178", + "new": "ix" + }, + { + "old": "\u2179", + "new": "x" + }, + { + "old": "\u217a", + "new": "xi" + }, + { + "old": "\u217b", + "new": "xii" + }, + { + "old": "\u217c", + "new": "l" + }, + { + "old": "\u217d", + "new": "c" + }, + { + "old": "\u217e", + "new": "d" + }, + { + "old": "\u217f", + "new": "m" + }, + { + "old": "\\s+(?u)", + "new": " ", + "regex": true + }, + { + "old": "\\n(?u)", + "regex": true + }, + { + "old": "^\\s+(?u)", + "regex": true + }, + { + "old": "\\s+$(?u)", + "regex": true + } + ] + }, + { + "type": "STRIP_NORMALIZER" + }, + { + "type": "BIDI_NORMALIZER" + } + ] + }, + "codec": { + "charset": [ + "", + " ", + "!", + "'", + "(", + ")", + "*", + "+", + ",", + "-", + ".", + "/", + "0", + "1", + "2", + "3", + "4", + "5", + "6", + "7", + "8", + "9", + ":", + "<", + ">", + "A", + "B", + "C", + "D", + "E", + "H", + "I", + "K", + "L", + "M", + "N", + "O", + "P", + "R", + "S", + "T", + "U", + "V", + "X", + "[", + "]", + "_", + "a", + "b", + "c", + "d", + "e", + "f", + "g", + "h", + "i", + "j", + "l", + "m", + "n", + "o", + "p", + "q", + "r", + "s", + "t", + "u", + "v", + "x", + "y", + "{", + "|", + "}", + "~", + "\u028e", + "\u0391", + "\u0392", + "\u0398", + "\u0399", + "\u03a4", + "\u03b1", + "\u03b2", + "\u03b3", + "\u03b4", + "\u03b5", + "\u03b6", + "\u03b7", + "\u03b8", + "\u03b9", + "\u03bb", + "\u03bc", + "\u03bd", + "\u03be", + "\u03bf", + "\u03c0", + "\u03c1", + "\u03c3", + "\u03c4", + "\u03c5", + "\u03c7", + "\u03c8", + "\u03c9", + "\u060c", + "\u061b", + "\u061f", + "\u0621", + "\u0622", + "\u0623", + "\u0624", + "\u0625", + "\u0626", + "\u0627", + "\u0628", + "\u0629", + "\u062a", + "\u062b", + "\u062c", + "\u062d", + "\u062e", + "\u062f", + "\u0630", + "\u0631", + "\u0632", + "\u0633", + "\u0634", + "\u0635", + "\u0636", + "\u0637", + "\u0638", + "\u0639", + "\u063a", + "\u0640", + "\u0641", + "\u0642", + "\u0643", + "\u0644", + "\u0645", + "\u0646", + "\u0647", + "\u0648", + "\u0649", + "\u064a", + "\u064b", + "\u064c", + "\u064d", + "\u064e", + "\u064f", + "\u0650", + "\u0651", + "\u0652" + ] + } + }, + "processes": 1, + "maxIters": 10000000, + "skipInvalidGt": true, + "display": 500.0, + "statsSize": 100, + "batchSize": 1, + "checkpointFrequency": -1.0, + "iter": 145655, + "lossStats": [ + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity", + "Infinity" + ], + "lerStats": [ + 0.0, + 0.0, + 0.0, + 0.0, + 0.014084507, + 0.0, + 0.0, + 0.015384615, + 0.0, + 0.0, + 0.078125, + 0.0, + 0.0, + 0.0, + 0.028985508, + 0.0, + 0.0, + 0.060606062, + 0.02739726, + 0.0, + 0.07462686, + 0.0, + 0.6666667, + 0.013888889, + 0.0, + 0.0, + 0.014925373, + 0.023809524, + 0.06849315, + 0.0125, + 0.0, + 0.05479452, + 0.0, + 0.0, + 0.015384615, + 0.0, + 0.014084507, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.09615385, + 0.0, + 0.0, + 0.0, + 0.03773585, + 0.0, + 0.0, + 0.0, + 0.2923077, + 0.08219178, + 0.0, + 0.2923077, + 0.0, + 0.0, + 0.1, + 0.0121951215, + 0.2631579, + 0.014492754, + 0.03125, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.044444446, + 0.0, + 0.0, + 0.0, + 0.028169014, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.14754099, + 0.015625, + 0.0, + 0.06122449, + 0.0, + 0.08695652, + 0.013888889, + 0.08196721, + 0.0, + 0.0, + 0.0, + 0.014084507, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "dtStats": [ + 0.0058140755, + 0.019767046, + 0.018239498, + 0.017900705, + 0.011180162, + 0.015616655, + 0.024158001, + 0.018197775, + 0.019973993, + 0.017692327, + 0.017540693, + 0.020246267, + 0.018060207, + 0.015184164, + 0.01999259, + 0.013505697, + 0.012892246, + 0.016251802, + 0.012347221, + 0.022394896, + 0.019113779, + 0.016187191, + 0.029903173, + 0.018415928, + 0.01743579, + 0.007453203, + 0.017097712, + 0.018715143, + 0.010941267, + 0.017695904, + 0.021075964, + 0.019222736, + 0.012110472, + 0.018174648, + 0.02011919, + 0.00896287, + 0.019127607, + 0.011254549, + 0.017180443, + 0.017914534, + 0.020277739, + 0.011871576, + 0.017511606, + 0.00698328, + 0.017426014, + 0.01917839, + 0.016541958, + 0.02371192, + 0.013701439, + 0.018181086, + 0.020401478, + 0.018236876, + 0.018331766, + 0.027264833, + 0.021715641, + 0.019104958, + 0.019204855, + 0.018625736, + 0.01859355, + 0.019647121, + 0.0072772503, + 0.020766258, + 0.020242214, + 0.020331621, + 0.034778118, + 0.021614313, + 0.031645536, + 0.018854856, + 0.027505875, + 0.022850037, + 0.02603364, + 0.017315865, + 0.01750803, + 0.01704526, + 0.012205124, + 0.016041756, + 0.019093752, + 0.018479586, + 0.024113178, + 0.016685486, + 0.014503717, + 0.018350363, + 0.018046618, + 0.006398678, + 0.018673658, + 0.019562483, + 0.014853716, + 0.017436981, + 0.020964384, + 0.017809153, + 0.02081561, + 0.020207167, + 0.0072407722, + 0.007790327, + 0.021091938, + 0.009856701, + 0.016828537, + 0.014018297, + 0.019638777, + 0.021436691 + ], + "totalTime": 2838.6177, + "earlyStoppingFrequency": -1.0, + "earlyStoppingNbest": 5, + "earlyStoppingBestModelPrefix": "best_arabic_new_4_", + "earlyStoppingBestAccuracy": 0.9755408, + "earlyStoppingBestCurNbest": 1, + "earlyStoppingBestAtIter": 145656, + "outputModelPrefix": "arabic_new_4_", + "dataAugRetrainOnOriginal": true, + "version": 2 +} \ No newline at end of file diff --git a/arabic/4.ckpt.h5 b/arabic/4.ckpt.h5 new file mode 100644 index 0000000..1da8646 Binary files /dev/null and b/arabic/4.ckpt.h5 differ diff --git a/arabic/4.ckpt.json b/arabic/4.ckpt.json new file mode 100644 index 0000000..f124e32 --- /dev/null +++ b/arabic/4.ckpt.json @@ -0,0 +1,1031 @@ +{ + "model": { + "network": { + "layers": [ + { + "filters": 40, + "kernelSize": { + "x": 3, + "y": 3 + }, + "stride": { + "x": 1, + "y": 1 + } + }, + { + "type": "MAX_POOLING", + "kernelSize": { + "x": 2, + "y": 2 + }, + "stride": { + "x": 2, + "y": 2 + } + }, + { + "filters": 60, + "kernelSize": { + "x": 3, + "y": 3 + }, + "stride": { + "x": 1, + "y": 1 + } + }, + { + "type": "MAX_POOLING", + "kernelSize": { + "x": 2, + "y": 2 + }, + "stride": { + "x": 2, + "y": 2 + } + }, + { + "type": "LSTM", + "hiddenNodes": 200 + } + ], + "solver": "ADAM_SOLVER", + "dropout": 0.5, + "features": 48, + "classes": 150, + "backend": { + "cudnn": true, + "shuffleBufferSize": 1000 + }, + "ctcMergeRepeated": true, + "learningRate": 0.001, + "clippingNorm": 5.0 + }, + "lineHeight": 48, + "dataPreprocessor": { + "lineHeight": 48, + "pad": 16 + }, + "textPreprocessor": { + "type": "MULTI_NORMALIZER", + "children": [ + { + "type": "TEXT_NORMALIZER" + }, + { + "type": "TEXT_REGULARIZER", + "replacements": [ + { + "old": "\u00b5", + "new": "\u03bc" + }, + { + "old": "\u2013\u2014\u2014", + "new": "-" + }, + { + "old": "\u2013\u2014", + "new": "-" + }, + { + "old": "\"", + "new": "''" + }, + { + "old": "`", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u00b4", + "new": "'" + }, + { + "old": "\u2018", + "new": "'" + }, + { + "old": "\u2019", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201e", + "new": ",," + }, + { + "old": "\u2026", + "new": "..." + }, + { + "old": "\u2032", + "new": "'" + }, + { + "old": "\u2033", + "new": "''" + }, + { + "old": "\u2034", + "new": "'''" + }, + { + "old": "\u3003", + "new": "''" + }, + { + "old": "\u2160", + "new": "I" + }, + { + "old": "\u2161", + "new": "II" + }, + { + "old": "\u2162", + "new": "III" + }, + { + "old": "\u2163", + "new": "IV" + }, + { + "old": "\u2164", + "new": "V" + }, + { + "old": "\u2165", + "new": "VI" + }, + { + "old": "\u2166", + "new": "VII" + }, + { + "old": "\u2167", + "new": "VIII" + }, + { + "old": "\u2168", + "new": "IX" + }, + { + "old": "\u2169", + "new": "X" + }, + { + "old": "\u216a", + "new": "XI" + }, + { + "old": "\u216b", + "new": "XII" + }, + { + "old": "\u216c", + "new": "L" + }, + { + "old": "\u216d", + "new": "C" + }, + { + "old": "\u216e", + "new": "D" + }, + { + "old": "\u216f", + "new": "M" + }, + { + "old": "\u2170", + "new": "i" + }, + { + "old": "\u2171", + "new": "ii" + }, + { + "old": "\u2172", + "new": "iii" + }, + { + "old": "\u2173", + "new": "iv" + }, + { + "old": "\u2174", + "new": "v" + }, + { + "old": "\u2175", + "new": "vi" + }, + { + "old": "\u2176", + "new": "vii" + }, + { + "old": "\u2177", + "new": "viii" + }, + { + "old": "\u2178", + "new": "ix" + }, + { + "old": "\u2179", + "new": "x" + }, + { + "old": "\u217a", + "new": "xi" + }, + { + "old": "\u217b", + "new": "xii" + }, + { + "old": "\u217c", + "new": "l" + }, + { + "old": "\u217d", + "new": "c" + }, + { + "old": "\u217e", + "new": "d" + }, + { + "old": "\u217f", + "new": "m" + }, + { + "old": "\\s+(?u)", + "new": " ", + "regex": true + }, + { + "old": "\\n(?u)", + "regex": true + }, + { + "old": "^\\s+(?u)", + "regex": true + }, + { + "old": "\\s+$(?u)", + "regex": true + } + ] + }, + { + "type": "STRIP_NORMALIZER" + }, + { + "type": "BIDI_NORMALIZER", + "bidiDirection": "BIDI_RTL" + } + ] + }, + "textPostprocessor": { + "type": "MULTI_NORMALIZER", + "children": [ + { + "type": "TEXT_NORMALIZER" + }, + { + "type": "TEXT_REGULARIZER", + "replacements": [ + { + "old": "\u00b5", + "new": "\u03bc" + }, + { + "old": "\u2013\u2014\u2014", + "new": "-" + }, + { + "old": "\u2013\u2014", + "new": "-" + }, + { + "old": "\"", + "new": "''" + }, + { + "old": "`", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u00b4", + "new": "'" + }, + { + "old": "\u2018", + "new": "'" + }, + { + "old": "\u2019", + "new": "'" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201d", + "new": "''" + }, + { + "old": "\u201c", + "new": "''" + }, + { + "old": "\u201e", + "new": ",," + }, + { + "old": "\u2026", + "new": "..." + }, + { + "old": "\u2032", + "new": "'" + }, + { + "old": "\u2033", + "new": "''" + }, + { + "old": "\u2034", + "new": "'''" + }, + { + "old": "\u3003", + "new": "''" + }, + { + "old": "\u2160", + "new": "I" + }, + { + "old": "\u2161", + "new": "II" + }, + { + "old": "\u2162", + "new": "III" + }, + { + "old": "\u2163", + "new": "IV" + }, + { + "old": "\u2164", + "new": "V" + }, + { + "old": "\u2165", + "new": "VI" + }, + { + "old": "\u2166", + "new": "VII" + }, + { + "old": "\u2167", + "new": "VIII" + }, + { + "old": "\u2168", + "new": "IX" + }, + { + "old": "\u2169", + "new": "X" + }, + { + "old": "\u216a", + "new": "XI" + }, + { + "old": "\u216b", + "new": "XII" + }, + { + "old": "\u216c", + "new": "L" + }, + { + "old": "\u216d", + "new": "C" + }, + { + "old": "\u216e", + "new": "D" + }, + { + "old": "\u216f", + "new": "M" + }, + { + "old": "\u2170", + "new": "i" + }, + { + "old": "\u2171", + "new": "ii" + }, + { + "old": "\u2172", + "new": "iii" + }, + { + "old": "\u2173", + "new": "iv" + }, + { + "old": "\u2174", + "new": "v" + }, + { + "old": "\u2175", + "new": "vi" + }, + { + "old": "\u2176", + "new": "vii" + }, + { + "old": "\u2177", + "new": "viii" + }, + { + "old": "\u2178", + "new": "ix" + }, + { + "old": "\u2179", + "new": "x" + }, + { + "old": "\u217a", + "new": "xi" + }, + { + "old": "\u217b", + "new": "xii" + }, + { + "old": "\u217c", + "new": "l" + }, + { + "old": "\u217d", + "new": "c" + }, + { + "old": "\u217e", + "new": "d" + }, + { + "old": "\u217f", + "new": "m" + }, + { + "old": "\\s+(?u)", + "new": " ", + "regex": true + }, + { + "old": "\\n(?u)", + "regex": true + }, + { + "old": "^\\s+(?u)", + "regex": true + }, + { + "old": "\\s+$(?u)", + "regex": true + } + ] + }, + { + "type": "STRIP_NORMALIZER" + }, + { + "type": "BIDI_NORMALIZER" + } + ] + }, + "codec": { + "charset": [ + "", + " ", + "!", + "'", + "(", + ")", + "*", + "+", + ",", + "-", + ".", + "/", + "0", + "1", + "2", + "3", + "4", + "5", + "6", + "7", + "8", + "9", + ":", + "<", + ">", + "A", + "B", + "C", + "D", + "E", + "H", + "I", + "K", + "L", + "M", + "N", + "O", + "P", + "R", + "S", + "T", + "U", + "V", + "X", + "[", + "]", + "_", + "a", + "b", + "c", + "d", + "e", + "f", + "g", + "h", + "i", + "j", + "l", + "m", + "n", + "o", + "p", + "q", + "r", + "s", + "t", + "u", + "v", + "x", + "y", + "{", + "|", + "}", + "~", + "\u028e", + "\u0391", + "\u0392", + "\u0398", + "\u0399", + "\u03a4", + "\u03b1", + "\u03b2", + "\u03b3", + "\u03b4", + "\u03b5", + "\u03b6", + "\u03b7", + "\u03b8", + "\u03b9", + "\u03bb", + "\u03bc", + "\u03bd", + "\u03be", + "\u03bf", + "\u03c0", + "\u03c1", + "\u03c3", + "\u03c4", + "\u03c5", + "\u03c7", + "\u03c8", + "\u03c9", + "\u060c", + "\u061b", + "\u061f", + "\u0621", + "\u0622", + "\u0623", + "\u0624", + "\u0625", + "\u0626", + "\u0627", + "\u0628", + "\u0629", + "\u062a", + "\u062b", + "\u062c", + "\u062d", + "\u062e", + "\u062f", + "\u0630", + "\u0631", + "\u0632", + "\u0633", + "\u0634", + "\u0635", + "\u0636", + "\u0637", + "\u0638", + "\u0639", + "\u063a", + "\u0640", + "\u0641", + "\u0642", + "\u0643", + "\u0644", + "\u0645", + "\u0646", + "\u0647", + "\u0648", + "\u0649", + "\u064a", + "\u064b", + "\u064c", + "\u064d", + "\u064e", + "\u064f", + "\u0650", + "\u0651", + "\u0652" + ] + } + }, + "processes": 1, + "maxIters": 10000000, + "skipInvalidGt": true, + "display": 500.0, + "statsSize": 100, + "batchSize": 1, + "checkpointFrequency": -1.0, + "iter": 72827, + "lossStats": [ + 9.23457, + 9.234443, + 9.234325, + 9.234199, + 9.234205, + 9.234083, + 9.233957, + 9.233834, + 9.233707, + 9.233654, + 9.233805, + 9.233685, + 9.23357, + 9.234143, + 9.234207, + 9.234351, + 9.234278, + 9.234237, + 9.234119, + 9.233993, + 9.233903, + 9.233826, + 9.233699, + 9.233574, + 9.233509, + 9.233391, + 9.233332, + 9.23321, + 9.233085, + 9.232959, + 9.232868, + 9.232828, + 9.232701, + 9.232577, + 9.232766, + 9.232774, + 9.232651, + 9.232747, + 9.232629, + 9.232511, + 9.232426, + 9.232299, + 9.232178, + 9.232052, + 9.231926, + 9.232586, + 9.232473, + 9.2323475, + 9.232222, + 9.23212, + 9.232019, + 9.231896, + 9.231773, + 9.231689, + 9.231565, + 9.231782, + 9.23166, + 9.231647, + 9.2315235, + 9.231618, + 9.2315035, + 9.231385, + 9.231313, + 9.231195, + 9.231092, + 9.23098, + 9.230858, + 9.230732, + 9.230651, + 9.230528, + 9.230543, + 9.230946, + 9.230826, + 9.2307005, + 9.230575, + 9.230448, + 9.2303505, + 9.230283, + 9.230166, + 9.2300415, + 9.229918, + 9.229792, + 9.230188, + 9.230249, + 9.230124, + 9.230004, + 9.229878, + 9.229762, + 9.229643, + 9.229518, + 9.229397, + 9.229304, + 9.229181, + 9.229339, + 9.229262, + 9.229164, + 9.229041, + 9.228993, + 9.2288685, + 9.228743 + ], + "lerStats": [ + 0.014492754, + 0.0, + 0.0, + 0.0, + 0.016393442, + 0.06451613, + 0.015625, + 0.015873017, + 0.030303031, + 0.011904762, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.018518519, + 0.014925373, + 0.013513514, + 0.02631579, + 0.014925373, + 0.0, + 0.013513514, + 0.114754096, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.03508772, + 0.0, + 0.014705882, + 0.016129032, + 0.0, + 0.013157895, + 0.0, + 0.0, + 0.08108108, + 0.0, + 0.015625, + 0.11111111, + 0.015151516, + 0.013513514, + 0.0, + 0.0, + 0.0, + 0.021276595, + 0.0, + 0.0, + 0.04477612, + 0.0, + 0.0, + 0.0, + 0.05263158, + 0.016949153, + 0.0, + 0.0, + 0.027777778, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.5, + 0.0, + 0.014492754, + 0.0952381, + 0.013157895, + 0.0, + 0.0, + 0.0, + 0.0, + 0.015384615, + 0.0, + 0.0, + 0.0, + 0.0, + 0.032786883, + 0.0, + 0.0, + 0.026666667, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.0, + 0.09615385, + 0.051282052, + 0.0, + 0.01724138, + 0.0, + 0.020408163, + 0.0, + 0.0, + 0.0, + 0.0 + ], + "dtStats": [ + 0.016378641, + 0.010848761, + 0.017914772, + 0.0055322647, + 0.013147116, + 0.012754917, + 0.01986289, + 0.021896124, + 0.005666256, + 0.015281677, + 0.02042842, + 0.016662598, + 0.008829832, + 0.015431404, + 0.01879716, + 0.018676043, + 0.017816544, + 0.015969992, + 0.019553661, + 0.006099701, + 0.01653862, + 0.028153896, + 0.01952076, + 0.019132376, + 0.030956745, + 0.017597675, + 0.028497458, + 0.016227245, + 0.015378475, + 0.010859728, + 0.017202616, + 0.01342082, + 0.017837763, + 0.019812346, + 0.020241976, + 0.01581049, + 0.017730236, + 0.0069777966, + 0.020970821, + 0.011835575, + 0.01768303, + 0.016471148, + 0.011403084, + 0.0133059025, + 0.008870363, + 0.012223244, + 0.027717352, + 0.01839161, + 0.018465996, + 0.014497042, + 0.016876936, + 0.019123793, + 0.017182112, + 0.02193904, + 0.017933607, + 0.016011, + 0.017465115, + 0.017858267, + 0.00611639, + 0.016758442, + 0.01816845, + 0.020523548, + 0.006071329, + 0.02074194, + 0.019769192, + 0.03070712, + 0.009758472, + 0.013127565, + 0.018982887, + 0.01845789, + 0.01710558, + 0.01458931, + 0.010099411, + 0.010418177, + 0.020358086, + 0.006326437, + 0.017245054, + 0.025384426, + 0.012755156, + 0.018000603, + 0.017271996, + 0.03046441, + 0.023336172, + 0.017164707, + 0.020392895, + 0.015864372, + 0.008839607, + 0.019475222, + 0.018908262, + 0.018733263, + 0.020027399, + 0.007179737, + 0.034102917, + 0.012349606, + 0.00825429, + 0.019454956, + 0.00897789, + 0.018138885, + 0.016556025, + 0.006004572 + ], + "totalTime": 1447.2695, + "earlyStoppingFrequency": -1.0, + "earlyStoppingNbest": 5, + "earlyStoppingBestModelPrefix": "best_arabic_new_5_", + "earlyStoppingBestAccuracy": 0.97983897, + "earlyStoppingBestCurNbest": 1, + "earlyStoppingBestAtIter": 72828, + "outputModelPrefix": "arabic_new_5_", + "dataAugRetrainOnOriginal": true, + "version": 2 +} \ No newline at end of file