From 98f1aeae197e34919b825b7fbe3a6f9e130c0067 Mon Sep 17 00:00:00 2001 From: sai-prasanna Date: Wed, 27 Nov 2019 16:23:36 +0530 Subject: [PATCH] Update to v0.2.0 Rename spacy model with `en_core_web_sm`. Fix special token handling for transformers lm. Update todos in readme.md. --- README.md | 10 +++--- lmproof/candidate_generators.py | 2 +- lmproof/scorer.py | 8 +++-- poetry.lock | 56 ++++++++++++++++++++------------- pyproject.toml | 2 +- 5 files changed, 46 insertions(+), 32 deletions(-) diff --git a/README.md b/README.md index 3d504bf..c6ac445 100644 --- a/README.md +++ b/README.md @@ -26,8 +26,6 @@ Unlike many approaches to GEC, this approach does NOT require annotated training This work builds upon https://github.com/chrisjbryant/lmgec-lite/ - - ## Components ### Language Models @@ -42,8 +40,8 @@ Pre-trained language models for other languages, inflectors, common error patter ## TODOs -* Research on distilling gpt-2 to a smaller model (LSTM?) to reduce the horrendous latency. -* Experiment on GEC dev sets to obtain optimal thresholds. -* Anyway to handle insertions. +* Use edits in existing GEC corpus to generate candidates. +* Tests +* Publish benchmarks of the model. +* Think of simple ways to generate insertion candidates. * Add more languages. -* Check whether LemmInflect proposals are actually better than just using [AGID](https://github.com/sai-prasanna/lmgec-lite/tree/master/resources/agid-2016.01.19). \ No newline at end of file diff --git a/lmproof/candidate_generators.py b/lmproof/candidate_generators.py index ffb2e89..ef529c5 100644 --- a/lmproof/candidate_generators.py +++ b/lmproof/candidate_generators.py @@ -96,7 +96,7 @@ def load(cls, language: str) -> "SpellCorrectGenerator": / "frequency_dictionary_en_82_765.txt" ) sym_spell.create_dictionary(str(dict_path)) - spacy_model = spacy.load("en", disable=["parser", "ner"]) + spacy_model = spacy.load("en_core_web_sm", disable=["parser", "ner"]) else: raise RuntimeError(f"The language {language} is currently not language.") return cls(sym_spell, spacy_model) diff --git a/lmproof/scorer.py b/lmproof/scorer.py index 201ded4..7c4634c 100644 --- a/lmproof/scorer.py +++ b/lmproof/scorer.py @@ -1,7 +1,7 @@ from typing import List, Optional +import logging import torch -import logging from torch.nn import CrossEntropyLoss from transformers import ( AutoTokenizer, @@ -25,6 +25,7 @@ def __init__( model: PreTrainedModel, device: str = "cpu", batch_size: int = 1, + add_special_tokens: bool = False, normalize: bool = False, ): # Load pre-trained model tokenizer (vocabulary) @@ -33,6 +34,7 @@ def __init__( self.model = model.to(self.device).eval() self.batch_size = batch_size self.normalize = normalize + self._add_special_tokens = add_special_tokens self._loss_fn = CrossEntropyLoss(ignore_index=-1) @classmethod @@ -58,7 +60,9 @@ def score(self, sentences: List[str]) -> List[Optional[float]]: tokenized_batch = [] for i, sentence in enumerate(batched_sentences): - tokens = self.tokenizer.encode(sentence) + tokens = self.tokenizer.encode( + sentence, add_special_tokens=self._add_special_tokens + ) if len(tokens) <= self.tokenizer.max_len: tokenized_batch.append(torch.LongTensor(tokens)) # type: ignore batch_scored_idx.append(i) diff --git a/poetry.lock b/poetry.lock index 2def1dc..f388dd6 100644 --- a/poetry.lock +++ b/poetry.lock @@ -9,6 +9,7 @@ version = "1.4.3" [[package]] category = "dev" description = "Atomic file writes." +marker = "sys_platform == \"win32\"" name = "atomicwrites" optional = false python-versions = ">=2.7, !=3.0.*, !=3.1.*, !=3.2.*, !=3.3.*" @@ -56,10 +57,10 @@ description = "The AWS SDK for Python" name = "boto3" optional = false python-versions = "*" -version = "1.10.16" +version = "1.10.28" [package.dependencies] -botocore = ">=1.13.16,<1.14.0" +botocore = ">=1.13.28,<1.14.0" jmespath = ">=0.7.1,<1.0.0" s3transfer = ">=0.2.0,<0.3.0" @@ -69,7 +70,7 @@ description = "Low-level, data-driven core of boto 3." name = "botocore" optional = false python-versions = "*" -version = "1.13.16" +version = "1.13.28" [package.dependencies] docutils = ">=0.10,<0.16" @@ -83,6 +84,19 @@ version = ">=2.1,<2.8.1" python = ">=3.4" version = ">=1.20,<1.26" +[[package]] +category = "main" +description = "Super lightweight function registries for your library" +name = "catalogue" +optional = false +python-versions = "!=3.0.*,!=3.1.*,!=3.2.*,!=3.3.*,>=2.7" +version = "0.0.8" + +[package.dependencies] +[package.dependencies.importlib-metadata] +python = "<3.8" +version = ">=0.20" + [[package]] category = "main" description = "Python package for providing Mozilla's CA Bundle." @@ -122,7 +136,7 @@ description = "Manage calls to calloc/free through Cython" name = "cymem" optional = false python-versions = "*" -version = "2.0.2" +version = "2.0.3" [[package]] category = "main" @@ -266,7 +280,7 @@ description = "plugin and hook calling mechanisms for python" name = "pluggy" optional = false python-versions = ">=2.7, !=3.0.*, !=3.1.*, !=3.2.*, !=3.3.*" -version = "0.13.0" +version = "0.13.1" [package.dependencies] [package.dependencies.importlib-metadata] @@ -307,7 +321,7 @@ description = "pytest: simple powerful testing with Python" name = "pytest" optional = false python-versions = ">=3.5" -version = "5.2.2" +version = "5.3.1" [package.dependencies] atomicwrites = ">=1.0" @@ -404,10 +418,11 @@ description = "Industrial-strength Natural Language Processing (NLP) in Python" name = "spacy" optional = false python-versions = "!=3.0.*,!=3.1.*,!=3.2.*,!=3.3.*,>=2.7" -version = "2.2.2" +version = "2.2.3" [package.dependencies] blis = ">=0.4.0,<0.5.0" +catalogue = ">=0.0.7,<1.1.0" cymem = ">=2.0.2,<2.1.0" murmurhash = ">=0.28.0,<1.1.0" numpy = ">=1.15.0" @@ -417,11 +432,7 @@ requests = ">=2.13.0,<3.0.0" setuptools = "*" srsly = ">=0.1.0,<1.1.0" thinc = ">=7.3.0,<7.4.0" -wasabi = ">=0.3.0,<1.1.0" - -[package.dependencies.importlib-metadata] -python = "<3.8" -version = ">=0.20" +wasabi = ">=0.4.0,<1.1.0" [[package]] category = "main" @@ -487,7 +498,7 @@ description = "Fast, Extensible Progress Meter" name = "tqdm" optional = false python-versions = ">=2.6, !=3.0.*, !=3.1.*" -version = "4.38.0" +version = "4.39.0" [[package]] category = "main" @@ -495,7 +506,7 @@ description = "State-of-the-art Natural Language Processing for TensorFlow 2.0 a name = "transformers" optional = false python-versions = "*" -version = "2.1.1" +version = "2.2.0" [package.dependencies] boto3 = "*" @@ -568,13 +579,14 @@ atomicwrites = ["03472c30eb2c5d1ba9227e4c2ca66ab8287fbfbbda3888aa93dc2e28fc6811b attrs = ["08a96c641c3a74e44eb59afb61a24f2cb9f4d7188748e76ba4bb5edfa3cb7d1c", "f7b7ce16570fe9965acd6d30101a28f62fb4a7f9e926b3bbc9b61f8b04247e72"] black = ["1b30e59be925fafc1ee4565e5e08abef6b03fe455102883820fe5ee2e4734e0b", "c2edb73a08e9e0e6f65a0e6af18b059b8b1cdd5bef997d7a0b181df93dc81539"] blis = ["03c368c9716ca814c436550a5f1e02ccf74850e613602519e3941d212e5aa177", "135450caabc8aea9bb9250329ebdf7189982d9b57d5c92789b2ba2fe52c247a7", "1402d9cbb0fbc21b749dd5b87d7ee14249e74a0ca38be6ecc56b3b356fca2f21", "26b16d6005bb2671699831b5cc699905215d1abde1ec5c1d04de7dcd9eb29f75", "3347a4b1b7d3ae14476aac9a6f7bf8ebf464863f4ebf4aea228874a7694ea240", "38fe877a4b52e762f5e137a412e3c256545a696a12ae8c40d67b8815d2bb5097", "4fb89c47ee06b58a4410a16fd5794847517262c9d2a342643475b477dfeff0a4", "77a6486b9794af01bcdfd1bc6e067c93add4b93292e6f95bf6e5ce7f98bf0163", "8aeaf6954351593a1e412f80e398aa51df588d3c0de74b9f3323b694c603381b", "d1d59faebc1c94f8f4f77154ef4b9d6d40364b111cf8fde48ee3b524c85f1075", "d69257d317e86f34a7f230a2fd1f021fd2a1b944137f40d8cdbb23bd334cd0c4", "ddd732c5274d1082fa92e2c42317587d5ebabce7741ca98120f69bd45d004b99", "f0b0dad4d6268d9dba0a65a9db12dd7a2d8686b648399e4aa1aec7550697e99e"] -boto3 = ["8ee908fc84041742384e916401d95dfd25738a8add5726e5020063e34b5aa30b", "fa4954929bdf54b4ab488d37ad29663b453f60e99892a797c7dd1baf3e62a5a8"] -botocore = ["dd295c4ad595c86a0ba4e570f4e5c013a7ea38bbf5e0d250f844e84fb040c14d", "ebb5b74c3f02e8965b47f8aed99e0e35df82e1f29d35b390835971700e82da4d"] +boto3 = ["21a75f1a3f85fbfcc00d691200fbe4aa71f18e98389d88401f38e35ae50825e9", "e4daa659f2aaf5664a32224cbcbbcaa9042ac657f1c64326d0e3230f967c2a30"] +botocore = ["5a343562b52d6216dbda89b8969dcbffa4474c7df9cbe04ee7440033c1c4075b", "9b886c4fc7efe0927ea90a3e070bc7e44dc6b8a1518ece6e99ecb21f52c75831"] +catalogue = ["98a71a99cc65eb26914fd8a3cc3027354337b870c80e9d3dc32e2c95a34e7df0", "c407a51c22f51b0f938104b6396c489145bae234386e68eb1d56326c3b3e128e"] certifi = ["e4f3620cfea4f83eedc95b24abd9cd56f3c4b146dd0177e83a21b4eb49e21e50", "fd7c7c74727ddcf00e9acd26bba8da604ffec95bf1c2144e67aff7a8b50e6cef"] chardet = ["84ab92ed1c4d4f16916e05906b6b75a6c0fb5db821cc65e70cbd64a3e2a5eaae", "fc323ffcaeaed0e0a02bf4d117757b98aed530d9ed4531e3e15460124c106691"] click = ["2335065e6395b9e67ca716de5f7526736bfa6ceead690adf616d925bdc622b13", "5b94b49521f6456670fdb30cd82a4eca9412788a93fa6dd6df72c94d5a8ff2d7"] colorama = ["05eed71e2e327246ad6b38c540c4a3117230b19679b875190486ddd2d721422d", "f8ac84de7840f5b9c4e3347b3c1eaa50f7e49c2b07596221daec5edaabbd7c48"] -cymem = ["081c652ae1aff4759813e93a2fc4df4ba410ce214a0e542988e24c62110d4cd0", "0e447fa4cb6dccd0b96257a798370a17bef3ec254a527230058e41816a777c04", "2c8267dcb15cc6ab318f01ceaf16b8440c0386ae44014d5b22fefe5b0398d05c", "46141111eedbb5b0d8c9386b00226a15f5727a1202b9095f4363d425f259267e", "4994c1f3e948bd58a6e38c905221680563b851983a15f1f01e5ff415d560d153", "584872fd3df176e50c90e37aaca6cb731ac0abcdea4f5b8ad77c30674cfaaa99", "6e3194135b21bb268030f3473beb8b674b356c330a9fa185dced2f5006cbd5ba", "71710ee0e946a6bd33c86dd9e71f95ad584c65e8bb02615f00ceb0d8348fb303", "741957f541fb8322de5a8c711d5d58f80d684225d2aec32fec92484cac931a52", "7f01ba6153427811cd7d35630081c69b32c188a1d330599a826ef3bf17edbd7c", "8d96e95902e781950d7c255b19364a1ed50a204843d63dd386b0abc5e6df5e44", "8dd169ece1629ec4db1a592321e3ae0a9bb62fda2052a351fc36871f314c3569", "8e6ad29636edd559b0dfe0a19c5cb5e6257461a5df90839e8c7710ddb005f4b4", "9935b233882732f03fd0fadbeb9e9aa672edcdd126e6d52c36d60adf1def8ea5", "a38b3229782411e4b23240f5f90000c4e7a834af88ed8763c66f8e4603db6b51", "a5966b3171bad9c84a2b19dccda5ab37ae8437c0709a6b72cb42b64ea76a4bd3", "ab88b1534f06df07262d9bc5efb3ba07948cdbe9a363eb9eaa4ad42fae6c7b5e", "b08b0dd7adafbff9f0fd7dc8dcad5f3ce6f23c126c81ad8d1666880cc94e6974", "ba47b571d480c0b76d282ff1634372070031d4998a46ae5d8305d49563b74ca6", "bf049dc9cf0d3aa4a48ba514b7f1699fb6f35b18ad8c6f018bd13e0bccd9d30c", "c46a122c524a3270ac5249f590ac2f75f1a83692a3d3a03479cea49de72a0a89", "c63337aa7e1ad4ec182cc7847c6d85390589fbbf1f9f67d1fde8133a9acb7fa8", "ec51273ea08a2c6389bc4dd6b5183354826d916b149a041f2f274431166191bc"] +cymem = ["5083b2ab5fe13ced094a82e0df465e2dbbd9b1c013288888035e24fd6eb4ed01", "622c20a57701d02f01a47e856dea248e112638f28c8249dbe3ed95a9702e3d74", "6f4cb689a9552e9e13dccc89203c8ab09f210a7ffb92ce27c384a4a0be27b527", "719f04a11ca709fc2b47868070d79fccff77e5d502ff32de2f4baa73cb16166f", "7236252bed70f37b898933dcf8aa875d0829664a245a272516f27b30439df71c", "7f5ddceb12b73f7fd2e4398266401b6f887003740ccd18c989a2af04500b5f2b", "85b9364e099426bd7f445a7705aad87bf6dbb71d79e3802dd8ca14e181d38a33", "c288a1bbdf58c360457443e5297e74844e1961e5e7001dbcb3a5297a41911a11", "cd21ec48ee70878d46c486e2f7ae94b32bfc6b37c4d27876c5a5a00c4eb75c3c", "d7505c500d994f11662e5595f5002251f572acc189f18944619352e2636f5181", "dd24848fbd75b17bab06408da6c029ba7cc615bd9e4a1f755fb3a090025fb922", "f4f19af4bca81f11922508a9dcf30ce1d2aee4972af9f81ce8e5331a6f46f5e1"] docutils = ["6c4f696463b79f1fb8ba0c594b63840ebd41f059e92b31957c46b74a4599b6d0", "9e4d7ecfc600058e07ba661411a2b7de2fd0fafa17d1a7f7361cd47b1175c827", "a2aeea129088da402665e92e0b25b04b073c04b2dce4ab65caaa38b7ce2e1a99"] future = ["b1bead90b70cf6ec3f0710ae53a525360fa360d306a86583adc6bf83a4db537d"] idna = ["c357b3f628cf53ae2c4c05627ecc484553142ca23264e593d327bcde5e9c3407", "ea8b7f6188e6fa117537c3df7da9fc686d485087abf6ac197f9c46432f7e4a3c"] @@ -590,11 +602,11 @@ numpy = ["0a7a1dd123aecc9f0076934288ceed7fd9a81ba3919f11a855a7887cbe82a02f", "0c packaging = ["28b924174df7a2fa32c1953825ff29c61e2f5e082343165438812f00d3a7fc47", "d9551545c6d761f3def1677baf08ab2a3ca17c56879e70fecba2fc4dde4ed108"] pathspec = ["e285ccc8b0785beadd4c18e5708b12bb8fcf529a1e61215b3feff1d1e559ea5c"] plac = ["398cb947c60c4c25e275e1f1dadf027e7096858fb260b8ece3b33bcff90d985f", "487e553017d419f35add346c4c09707e52fa53f7e7181ce1098ca27620e9ceee"] -pluggy = ["0db4b7601aae1d35b4a033282da476845aa19185c1e6964b25cf324b5e4ec3e6", "fa5fa1622fa6dd5c030e9cad086fa19ef6a0cf6d7a2d12318e10cb49d6d68f34"] +pluggy = ["15b2acde666561e1298d71b523007ed7364de07029219b604cf808bfa1c765b0", "966c145cd83c96502c3c3868f50408687b38434af77734af1e9ca461a4081d2d"] preshed = ["0c15ae62f2595ca479decc3452967484dae57b510278800f5deb9115238cc818", "1be3cb59211282e906a11443464fe3e19f6561e2fcd06410e4adc6d45354cf82", "1ef72a120e49356058b3c0590d7b5e91f2747b44e006eef6579be6131223cab0", "253970beae87ab672a6afb543908761795eea3cb7b0d784e2ea51e265752059e", "448d9df12e63fe4a3024f6153ee6703bb95d2be0ce887b5eda7ddc41acfba825", "61d73468c97c1d6d5a048de0b01d5a6fd052123358aca4823cdb277e436436cb", "633358f1fb0ec5dd6dbe4971c328d08809e5a8dbefdf13a802ae0a7cb45306c7", "6518bbd5fb8adbc3231e75ae78d96a7bdd5405a3b23a09d5e62a2e4fc833724e", "7e80ffc1fb79496d4feafe0eaf71ee5e532b91daf6cec235d7f9c4c12657a58c", "7ea588a78aaf310ae2c293071a8571b07ae434819be05fe510442b6df3f8fbf7", "88427346b220293439db77c82913791fa13edc6ac73d8159610699a3ca17aae9", "8a9a8222a697a513f25a94733e7a17cc298ecd8fd56b606a1d8fa0ac342c2830", "ece5e850f667eaa3367d5c56dda9e3aa6ac1c0bb2117d2f466a26db5f26bbe4b"] py = ["64f65755aee5b381cea27766a3a147c3f15b9b6b9ac88676de66ba2ae36793fa", "dc639b046a6e2cff5bbe40194ad65936d6ba360b52b3c3fe1d08a82dd50b5e53"] pyparsing = ["20f995ecd72f2a1f4bf6b072b63b22e2eb457836601e76d6e5dfcd75436acc1f", "4ca62001be367f01bd3e92ecbb79070272a9d4964dce6a48a82ff0b8bc7e683a"] -pytest = ["27abc3fef618a01bebb1f0d6d303d2816a99aa87a5968ebc32fe971be91eb1e6", "58cee9e09242937e136dbb3dab466116ba20d6b7828c7620f23947f37eb4dae4"] +pytest = ["63344a2e3bce2e4d522fd62b4fdebb647c019f1f9e4ca075debbd13219db4418", "f67403f33b2b1d25a6756184077394167fe5e2f9d8bdaab30707d19ccec35427"] python-dateutil = ["7e6584c74aeed623791615e26efd690f29817a27c73085b78e4bad02493df2fb", "c89805f6f4d64db21ed966fda138f8a5ed7a4fdbc1a8ee329ce1b74e3c74da9e"] regex = ["15454b37c5a278f46f7aa2d9339bda450c300617ca2fca6558d05d870245edc7", "1ad40708c255943a227e778b022c6497c129ad614bb7a2a2f916e12e8a359ee7", "5e00f65cc507d13ab4dfa92c1232d004fa202c1d43a32a13940ab8a5afe2fb96", "604dc563a02a74d70ae1f55208ddc9bfb6d9f470f6d1a5054c4bd5ae58744ab1", "720e34a539a76a1fedcebe4397290604cc2bdf6f81eca44adb9fb2ea071c0c69", "7caf47e4a9ac6ef08cabd3442cc4ca3386db141fb3c8b2a7e202d0470028e910", "7faf534c1841c09d8fefa60ccde7b9903c9b528853ecf41628689793290ca143", "b4e0406d822aa4993ac45072a584d57aa4931cf8288b5455bbf30c1d59dbad59", "c31eaf28c6fe75ea329add0022efeed249e37861c19681960f99bbc7db981fb2", "c7393597191fc2043c744db021643549061e12abe0b3ff5c429d806de7b93b66", "d2b302f8cdd82c8f48e9de749d1d17f85ce9a0f082880b9a4859f66b07037dc6", "e3d8dd0ec0ea280cf89026b0898971f5750a7bd92cb62c51af5a52abd020054a", "ec032cbfed59bd5a4b8eab943c310acfaaa81394e14f44454ad5c9eba4f24a74"] requests = ["11e007a8a2aa0323f5a921e9e6a2d7e4e67d9877e85773fba9ba6419025cbeb4", "9cf5292fcd0f598c671cfc1e0d7d1a7f13bb8085e9a590f48c010551dc6c4b31"] @@ -602,14 +614,14 @@ s3transfer = ["6efc926738a3cd576c2a79725fed9afde92378aa5c6a957e3af010cb019fac9d" sacremoses = ["1e84da95cbdbfc8bbc148c0feb5a4737c5d9757071b79e8c1129e449410e410a"] sentencepiece = ["0014d39669289f7925c55e050932a907fa2199b1404385ddb4a69608f75e5b17", "07a544533bbefec3dda5ef15cd00e9b4b9abb3ed0c82eb4b4c57d5f5fd01180b", "1234b461c7706466368624d4a17661984f310708a61c6915174f9b49214ce001", "2055e1e089f08d25f822ede20d004df64d02789b290d115c20aae86d349afed4", "268bb70d89e6c808086844a96a2f086f3b05a66fc6d3e25e2c50691cb3fd14b1", "4240117d7af47b596b8bbea2a8a09ce9f25ac234027030541f188490ad4f367b", "49973f229728d858f9a97ad5c6f54c897b7dc10eddbd19f350f9870320540728", "4daf9930f5e8882e09b6b1052614ab02e7db40ca83032160d49e7956e447d1f4", "791ea9c0a5425f6dd2be6ea353ada94f53ca0964d96b5bf60d2a8e0b1abdfb5f", "7eac4a9e4c51f6297b451ce670fce104e6f0e74049e304416bdde6e66c2708a6", "8174139eca911fdbeab0fcf5eb5f96341959ccda9d403da7695261f20ec909f5", "845748caaebc2fc3b3292537b98d4c5a31e5f15285f7d061ce1f6c795fe2884e", "877a130c1787e2f210e5d7e317e8606ebdc212a1508101ff1bc155aa2ff51f20", "9d206332f6d03fd3e9be40dbe4c04538d0c4d732c5e6314058c1cec3868ef213", "ac049046d3a970aa9cb48a707a4d9cc8e1fcc060eeab7fcb7d03086b40dff70c", "c1b4a5a93b95dd2ac03f3c099654e418800c1ff8fd7d1691f42bdbe8719ae4d3", "ceb495ea00bf04ac9ee1a16a78a8d29efbac9e4ae4744bb1c11d8911fe7eb2e9", "d194cf7431dd87798963ff998380f1c02ff0f9e380cc922a07926b69e21c4e2b", "df2a04cffe27f1394008e55e75239804c907d9358214ff9d6252b1c3cfa7f4ab", "f664c90a0637f5e0ed87cefb337aeb976fa44f3c59cb0aecbb78ac0688184378", "fdbf04c50f131c36867bde2ae6ff48e1fd5216e43c8087fff1f762b7bf9d229a", "fde644520c9c21ab1ee3e2a93be65ca751c971ccc166f0fce20db7f5da324029"] six = ["1f1b7d42e254082a9db6279deae68afb421ceba6158efa6131de7b3003ee93fd", "30f610279e8b2578cab6db20741130331735c781b56053c59c4076da27f06b66"] -spacy = ["33b9aacddad185d4b5cd2fddbe57375f93a88741e06992670f342a002685fb50", "4a1b47a1af437f43987384cd6d8061f5b3e8985f0f2b323f9644ba8e733e79a4", "6311a3040cd40d890307ef316ce193422b074d1eda20f2c9a5e04cef58f494c6", "643200afff7bdb1631d58eb36d00c8f493bf038ed8ab59fb30ddf7fd3aea36b5", "72419014d91be4e3407e1610a13909d91fd0b989638b1343863318f294dba226", "87e2690274086a4d128c17077d2c887c5bb225490f429204858ea5a19121aebf", "926a7f48011d920e347fa02174421cecffc4d35e68d310e2a8e60fa2732fef9b", "936e1a9adc52d3de07efb1af638c9d19993a4873f0d03038b04f38bf35dc08d0", "a10625ac4d05d94034a0e68c9147a385eb9742ff703e7578f928175ba5e6a470", "a9d7a482fb75ad923fc59a7bb9d0148f571b778880e157f1f399a7fb4073eb5b"] +spacy = ["1d14c9e7d65b2cecd56c566d9ffac8adbcb9ce2cff2274cbfdcf5468cd940e6a", "2cb77315522cc422df7750dac778f13d8079f409b4842cf74a54ffe3b84ee5c6", "3c83c061597b5dc94c939c511d3b72c2971257204f21976afc117a350e8fa92b", "6971359e43841ff9ed87e1af5e87ea74d6fdb01fe54807d3e4c6a2a3798d18a4", "708d25c7212bd20d1268c6559e191d221e88e68e152fb98b82c388d16dfdd3d7", "713811c96396c6bb86a1da2bbbe02d874385e74dde6617a84d61d99e9d2b1105", "7fa02ababbb3762277b81873204d78583008b408ddf6fc0ef977b38d3b462b85", "8d1ce99fc30d634b63b15d98c49b96d6a40b0d2048d5dad0f2bb31d3f6dc5ef0", "9afdec1aeb21dbeccfd4d702f12fe8bab88e4d7cd410785bf17f6b186cbc73e8", "ce7fad73de7aed7ca2ee7c2404c77c72005f67ca95edae6f19f08947fb0f8ab3", "d6a2804c457ce74f0d3bf1f4cdb00cbcd228e9da5f0bdbbbe0a856afe12db37e", "d8791f5f69800d702b8e9457418af2cd29789b82697d17ad66df98922f081d1b"] srsly = ["41f2fe803fe6985eb79982ce5d571b81413adfe2d01dcd470e55c6a0f16e07d8", "6ec70d50d2a63452faf5b7606120310c4a95f2c24d931bd8f5babae9d1d99412", "798010e744469f65b3c492eac77d9b46a47a7bc229428f63e9c1c7445efc1809", "8730016fc5ca49dbaf676a8d02b12b184e909a26e596d51f46a6c71a963de462", "8ffa7deafac1fb961385eff6feed324b5890b42175e1dde2c3e3fab2034756bb", "97e5101d6ff08e5a2ebd83fc31b48c90aad24ba35eb4468f5b7ec56ecd8bdb6b", "9e9a395ea53dbac0b705556246d1a9f8e5fea9ba49bc63ec3d3de05bfbe48735", "aa02e2a62093ef09d7904343ee7381b9c9bab5b4f06960dfbeaa12035d0f0a3e", "c62acffd96b4699820e39fcc47fc5a45ff14432c4665d4112ee08e42aeda047e", "d30074fdb05a739358fef33701315f8247161fbdb52f29fca368d10c2ef23fae", "f2f6a950b801352f596667459839235cf059b39307e4034d7ed68e7dfb497bd6", "f48623820170eff0e2fc79419688a16f5977916548dd0d3a8d0d3fc93a7978ad"] symspellpy = ["884a6496462288576f6ab5d6888f84e406e871031e0c64de1c3aa6c78d5ee35a", "ab1adacd40a616741181121e8927c9c4d43bb961756b97c642ed60dc3960b469"] thinc = ["1dbaec0628040a1f8d66147fadbf7775ad6dfe4c681424b2e20479c1e54dc3c1", "30790a1a496a8a84fe300edf50df50454dbdb625b41b203739fbc03112a4d3b6", "56b67887930df87c28af2cc4d046c6bc3e80ed4ff3e57208a4fb7a348d12a580", "650fbead603bd7e73a61fd2c1b69202ad7a8eb70d4ebe7c5484b8788e828b6e0", "713adad69c108dbdc145276d077c4a80f3df31a39b3fc574782dcb64b1def815", "801f32f6c048de7e9f6d406342080e6348d0bb02beb1412811f9150a26661691", "8833246f1c8b95143c91e310728bf64af8972a9d8653252efa1b4c9036837569", "93cb9d184115a8890321dd7f5d94a0d8235dc2fca54d92a9c1c051234a7af43e", "bad16bcc608ec4d74c680d85aa9bf43cfc776ac12ca3b7e699d7283fd0177bca", "ce81d6b2372057e10f9d7cb505942df67a803f270d69959d44d372e8e3792bb9"] toml = ["229f81c57791a41d65e399fc06bf0848bab550a9dfd5ed66df18ce5f05e73d5c", "235682dd292d5899d361a811df37e04a8828a5b1da3115886b73cf81ebc9100e", "f1db651f9657708513243e61e6cc67d101a39bad662eaa9b5546f789338e07a3"] torch = ["0cec2e13a2e95c24c34f17d437f354ee2a40902e8d515a524556b350e12555dd", "134e8291a97151b1ffeea09cb9ddde5238beb4e6d9dfb66657143d6990bfb865", "31062923ac2e60eac676f6a0ae14702b051c158bbcf7f440eaba266b0defa197", "3b05233481b51bb636cee63dc761bb7f602e198178782ff4159d385d1759608b", "458f1d87e5b7064b2c39e36675d84e163be3143dd2fc806057b7878880c461bc", "72a1c85bffd2154f085bc0a1d378d8a54e55a57d49664b874fe7c949022bf071", "77fd8866c0bf529861ffd850a5dada2190a8d9c5167719fb0cfa89163e23b143", "b6f01d851d1c5989d4a99b50ae0187762b15b7718dcd1a33704b665daa2402f9", "d8e1d904a6193ed14a4fed220b00503b2baa576e71471286d1ebba899c851fae"] -tqdm = ["9de4722323451eb7818deb0161d9d5523465353a6707a9f500d97ee42919b902", "c1d677f3a85fa291b34bdf8f770f877119b9754b32673699653556f85e2c2f13"] -transformers = ["13835931987d50001cdf0c6a158343d822dc4fc99534c67b9e3a74e13ed1f24d", "bc0aee900929ee51ce1ad13e4c00b6b7900177e522ec4b393a2aab10fa02b7bd"] +tqdm = ["5a1f3d58f3eb53264387394387fe23df469d2a3fab98c9e7f99d5c146c119873", "f1a1613fee07cc30a253051617f2a219a785c58877f9f6bfa129446cbaf8b4c1"] +transformers = ["1d322bdb8a046ac40a5656daf5ce1b48422ccbb597ccf68c0f3636b60463b2a7", "cd86ed6e91447f0647ef6e8f0984f6fcd3a95382405e733f8b5c672f368ce84b"] typed-ast = ["1170afa46a3799e18b4c977777ce137bb53c7485379d9706af8a59f2ea1aa161", "18511a0b3e7922276346bcb47e2ef9f38fb90fd31cb9223eed42c85d1312344e", "262c247a82d005e43b5b7f69aff746370538e176131c32dda9cb0f324d27141e", "2b907eb046d049bcd9892e3076c7a6456c93a25bebfe554e931620c90e6a25b0", "354c16e5babd09f5cb0ee000d54cfa38401d8b8891eefa878ac772f827181a3c", "48e5b1e71f25cfdef98b013263a88d7145879fbb2d5185f2a0c79fa7ebbeae47", "4e0b70c6fc4d010f8107726af5fd37921b666f5b31d9331f0bd24ad9a088e631", "630968c5cdee51a11c05a30453f8cd65e0cc1d2ad0d9192819df9978984529f4", "66480f95b8167c9c5c5c87f32cf437d585937970f3fc24386f313a4c97b44e34", "71211d26ffd12d63a83e079ff258ac9d56a1376a25bc80b1cdcdf601b855b90b", "7954560051331d003b4e2b3eb822d9dd2e376fa4f6d98fee32f452f52dd6ebb2", "838997f4310012cf2e1ad3803bce2f3402e9ffb71ded61b5ee22617b3a7f6b6e", "95bd11af7eafc16e829af2d3df510cecfd4387f6453355188342c3e79a2ec87a", "bc6c7d3fa1325a0c6613512a093bc2a2a15aeec350451cbdf9e1d4bffe3e3233", "cc34a6f5b426748a507dd5d1de4c1978f2eb5626d51326e43280941206c209e1", "d755f03c1e4a51e9b24d899561fec4ccaf51f210d52abdf8c07ee2849b212a36", "d7c45933b1bdfaf9f36c579671fec15d25b06c8398f113dab64c18ed1adda01d", "d896919306dd0aa22d0132f62a1b78d11aaf4c9fc5b3410d3c666b818191630a", "fdc1c9bbf79510b76408840e009ed65958feba92a88833cdceecff93ae8fff66", "ffde2fbfad571af120fcbfbbc61c72469e72f550d676c3342492a9dfdefb8f12"] typing-extensions = ["091ecc894d5e908ac75209f10d5b4f118fbdb2eb1ede6a63544054bb1edb41f2", "910f4656f54de5993ad9304959ce9bb903f90aadc7c67a0bef07e678014e892d", "cf8b63fedea4d89bab840ecbb93e75578af28f76f66c35889bd7065f5af88575"] urllib3 = ["06330f386d6e4b195fbfc736b297f58c5a892e4440e54d294d7004e3a9bbea1b", "cc44da8e1145637334317feebd728bd869a35285b93cbb4cca2577da7e62db4f"] diff --git a/pyproject.toml b/pyproject.toml index 101984c..ce9d0a6 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -1,6 +1,6 @@ [tool.poetry] name = "lmproof" -version = "0.1.1b" +version = "0.2.0" description = "Language model powered proof reader for correcting contextual errors in natural language." authors = ["sai-prasanna "] readme = "README.md"