Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							d81b7be6a2
							
						
					 | 
					
						
						
							
							* Merge train.py
						
						
						
						
						
					 | 
					
						2015-03-26 16:44:41 +01:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							0962ffc095
							
						
					 | 
					
						
						
							
							* Fix issue #37: missing check_flag attribute from Token class
						
						
						
						
						
					 | 
					
						2015-03-26 15:06:26 +01:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							a61dacb4e5
							
						
					 | 
					
						
						
							
							* Add tests for new subtree method
						
						
						
						
						
					 | 
					
						2015-03-03 05:41:00 -05:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							47a4371fea
							
						
					 | 
					
						
						
							
							* Upd tokenizer with i.e. tests
						
						
						
						
						
					 | 
					
						2015-02-18 06:37:04 -05:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							9dbc31d72c
							
						
					 | 
					
						
						
							
							* Add test from NSchrading
						
						
						
						
						
					 | 
					
						2015-02-16 11:49:31 -05:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							7572e31f5e
							
						
					 | 
					
						
						
							
							* Pass ownership of C data to Token instances if Tokens object is being garbage-collected, but Token instances are staying alive.
						
						
						
						
						
					 | 
					
						2015-02-11 18:05:06 -05:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								leofidus
							
						 
					 | 
					
						
						
						
						
							
						
						
							363473aeed
							
						
					 | 
					
						
						
							
							Add rokenizer test for zero length string
						
						
						
						
						
					 | 
					
						2015-02-10 08:20:32 -05:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							99f0a315f9
							
						
					 | 
					
						
						
							
							* Add test for Issue 24
						
						
						
						
						
					 | 
					
						2015-02-08 18:30:46 -05:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							3e8c87af1a
							
						
					 | 
					
						
						
							
							* Extend parse tree navigation tests
						
						
						
						
						
					 | 
					
						2015-02-07 18:28:45 -05:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							aadc57ab00
							
						
					 | 
					
						
						
							
							* Add tests for tokens api
						
						
						
						
						
					 | 
					
						2015-02-07 13:14:07 -05:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							6b68607b1f
							
						
					 | 
					
						
						
							
							* Add some tests for the code in the index.html docstrings
						
						
						
						
						
					 | 
					
						2015-02-07 08:52:13 -05:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							7d9d8c1489
							
						
					 | 
					
						
						
							
							* Fix test_tag_names again
						
						
						
						
						
					 | 
					
						2015-02-01 16:25:03 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							d1c9e7ff70
							
						
					 | 
					
						
						
							
							* Make test_tag_names version-portable
						
						
						
						
						
					 | 
					
						2015-02-01 15:40:20 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							1f31774078
							
						
					 | 
					
						
						
							
							* Python3 fix for test_tag_names
						
						
						
						
						
					 | 
					
						2015-02-01 13:14:20 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							0fd4a71bed
							
						
					 | 
					
						
						
							
							* Add provisional tests for sentence boundary detection
						
						
						
						
						
					 | 
					
						2015-01-31 13:46:11 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							2da694f65e
							
						
					 | 
					
						
						
							
							* Don't load parser in test_pre_punct
						
						
						
						
						
					 | 
					
						2015-01-30 20:11:47 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							0b53fd7daa
							
						
					 | 
					
						
						
							
							* Add test for parse tree navigation
						
						
						
						
						
					 | 
					
						2015-01-30 18:02:58 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							7d432b7e39
							
						
					 | 
					
						
						
							
							* Add tests for vector-space model
						
						
						
						
						
					 | 
					
						2015-01-30 16:45:45 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							48b98e3fb5
							
						
					 | 
					
						
						
							
							* Add test for tag names
						
						
						
						
						
					 | 
					
						2015-01-30 16:45:11 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							613a195f92
							
						
					 | 
					
						
						
							
							* Add test for indices
						
						
						
						
						
					 | 
					
						2015-01-30 16:44:29 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							03cc2ee08e
							
						
					 | 
					
						
						
							
							* Add test for numpy array transport
						
						
						
						
						
					 | 
					
						2015-01-30 16:43:55 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							b3f9b199cf
							
						
					 | 
					
						
						
							
							Merge branch 'punctparse'
						
						
						
						
						
					 | 
					
						2015-01-30 16:38:56 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							d0e08a5b57
							
						
					 | 
					
						
						
							
							* Upd index tests
						
						
						
						
						
					 | 
					
						2015-01-30 12:35:13 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							35a18250cc
							
						
					 | 
					
						
						
							
							* Upd tests, avoiding unnecessary processing to make testing faster
						
						
						
						
						
					 | 
					
						2015-01-30 10:41:55 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							bda5347c5c
							
						
					 | 
					
						
						
							
							* Fix unicode in test
						
						
						
						
						
					 | 
					
						2015-01-25 19:04:23 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							706305ee26
							
						
					 | 
					
						
						
							
							* Upd tests for new meaning of 'string'
						
						
						
						
						
					 | 
					
						2015-01-24 07:22:30 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							5ed8b2b98f
							
						
					 | 
					
						
						
							
							* Rename sic to orth
						
						
						
						
						
					 | 
					
						2015-01-23 02:08:25 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							93d4bd6c2e
							
						
					 | 
					
						
						
							
							* Add test for ). in tokenizer
						
						
						
						
						
					 | 
					
						2015-01-22 22:25:18 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							06e7456c65
							
						
					 | 
					
						
						
							
							* Upd tests
						
						
						
						
						
					 | 
					
						2015-01-17 17:33:23 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							802867e96a
							
						
					 | 
					
						
						
							
							* Revise interface to Token. Strings now have attribute names like norm1_
						
						
						
						
						
					 | 
					
						2015-01-15 03:51:47 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							7d3c40de7d
							
						
					 | 
					
						
						
							
							* Tests passing after refactor. API has obvious warts, particularly in Token and Lexeme
						
						
						
						
						
					 | 
					
						2015-01-15 00:33:16 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							dc681920bc
							
						
					 | 
					
						
						
							
							* Upd asciify test, fixing type error
						
						
						
						
						
					 | 
					
						2015-01-06 01:09:44 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							64f33a8705
							
						
					 | 
					
						
						
							
							* Upd asciify test, fixing type error
						
						
						
						
						
					 | 
					
						2015-01-06 01:03:29 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							0aa9860c2d
							
						
					 | 
					
						
						
							
							* Fix string-typing in test_contractions. API is inconsistent, must fix...
						
						
						
						
						
					 | 
					
						2015-01-05 20:10:03 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							ee3a71862e
							
						
					 | 
					
						
						
							
							* Fix unicode bugs in tests
						
						
						
						
						
					 | 
					
						2015-01-05 17:54:54 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							166c09832f
							
						
					 | 
					
						
						
							
							* Upd test for Python3
						
						
						
						
						
					 | 
					
						2015-01-05 13:15:46 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							775a66e2b6
							
						
					 | 
					
						
						
							
							* Fix encoding in lemmatizer tests
						
						
						
						
						
					 | 
					
						2015-01-05 11:53:30 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							33b7b3182a
							
						
					 | 
					
						
						
							
							* Relax lemma test for now
						
						
						
						
						
					 | 
					
						2015-01-04 01:16:18 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							5d7e6e37ea
							
						
					 | 
					
						
						
							
							* Refine lemma test to probe failure
						
						
						
						
						
					 | 
					
						2015-01-03 23:41:16 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							4a5cb20899
							
						
					 | 
					
						
						
							
							* Upd test given new data file layout
						
						
						
						
						
					 | 
					
						2015-01-03 01:59:56 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							81d878beb2
							
						
					 | 
					
						
						
							
							* Upd tests
						
						
						
						
						
					 | 
					
						2014-12-30 21:34:09 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							91a5064b7f
							
						
					 | 
					
						
						
							
							* Upd tests
						
						
						
						
						
					 | 
					
						2014-12-26 14:26:27 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							b00bc01d8c
							
						
					 | 
					
						
						
							
							* All tests now passing for reorg
						
						
						
						
						
					 | 
					
						2014-12-23 13:18:59 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							73f200436f
							
						
					 | 
					
						
						
							
							* Tests passing except for morphology/lemmatization stuff
						
						
						
						
						
					 | 
					
						2014-12-23 11:40:32 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							cf8d26c3d2
							
						
					 | 
					
						
						
							
							* POS tagger training working after reorg
						
						
						
						
						
					 | 
					
						2014-12-22 08:54:47 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							4d4d2c0db4
							
						
					 | 
					
						
						
							
							* Upd test
						
						
						
						
						
					 | 
					
						2014-12-21 21:05:28 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							d047dc0d0f
							
						
					 | 
					
						
						
							
							Upd lemmatizer test
						
						
						
						
						
					 | 
					
						2014-12-21 21:02:44 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							b864f0e539
							
						
					 | 
					
						
						
							
							* Upd iteration test
						
						
						
						
						
					 | 
					
						2014-12-21 21:01:46 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							c1ab134159
							
						
					 | 
					
						
						
							
							* Upd lemmas test
						
						
						
						
						
					 | 
					
						2014-12-21 20:58:21 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							82bd57c76f
							
						
					 | 
					
						
						
							
							* Upd intern test
						
						
						
						
						
					 | 
					
						2014-12-21 20:44:21 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							734d1da55c
							
						
					 | 
					
						
						
							
							* Upd emoticons test
						
						
						
						
						
					 | 
					
						2014-12-21 20:43:27 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							199025609f
							
						
					 | 
					
						
						
							
							* Upd contractions test
						
						
						
						
						
					 | 
					
						2014-12-21 20:41:13 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							0d9972f4b0
							
						
					 | 
					
						
						
							
							* Upd tokenizer test
						
						
						
						
						
					 | 
					
						2014-12-21 20:38:27 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							ed2fff6128
							
						
					 | 
					
						
						
							
							* Add tests
						
						
						
						
						
					 | 
					
						2014-12-20 03:51:25 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							516f0f1e14
							
						
					 | 
					
						
						
							
							* Remove test for loading ad hoc rules format
						
						
						
						
						
					 | 
					
						2014-12-09 16:08:45 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							6369835306
							
						
					 | 
					
						
						
							
							* Add false positive test for emoticons
						
						
						
						
						
					 | 
					
						2014-12-09 16:08:17 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							2a6bd2818f
							
						
					 | 
					
						
						
							
							* Load the lexicon before we check flag values
						
						
						
						
						
					 | 
					
						2014-12-09 15:18:43 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							302e09018b
							
						
					 | 
					
						
						
							
							* Work on fixing special-cases, reading them in as JSON objects so that they can specify lemmas
						
						
						
						
						
					 | 
					
						2014-12-09 14:48:01 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							cda9ea9a4a
							
						
					 | 
					
						
						
							
							* Add test to make sure iterating over the lexicon isnt broken
						
						
						
						
						
					 | 
					
						2014-12-08 21:12:51 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							7b68f911cf
							
						
					 | 
					
						
						
							
							* Add WordNet lemmatizer
						
						
						
						
						
					 | 
					
						2014-12-08 01:39:13 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							8f2f319c57
							
						
					 | 
					
						
						
							
							* Add a couple more contractions tests
						
						
						
						
						
					 | 
					
						2014-12-07 22:08:04 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							14097311ae
							
						
					 | 
					
						
						
							
							* Make StringStore.__getitem__ accept unicode-typed keys.
						
						
						
						
						
					 | 
					
						2014-12-03 01:33:20 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							60c1e78596
							
						
					 | 
					
						
						
							
							* Commit outstanding tests
						
						
						
						
						
					 | 
					
						2014-11-12 23:24:32 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							b01604b303
							
						
					 | 
					
						
						
							
							* Upd NER tests
						
						
						
						
						
					 | 
					
						2014-11-11 21:10:04 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							10e9e14c4f
							
						
					 | 
					
						
						
							
							* Add tests for NER oracle
						
						
						
						
						
					 | 
					
						2014-11-10 22:13:46 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							d7b2843643
							
						
					 | 
					
						
						
							
							* Add some tests for ner
						
						
						
						
						
					 | 
					
						2014-11-10 16:29:19 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							a42321bd4e
							
						
					 | 
					
						
						
							
							* Upd shape test
						
						
						
						
						
					 | 
					
						2014-11-07 04:42:54 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							81da61f3cf
							
						
					 | 
					
						
						
							
							* Remove out-dated POS data test
						
						
						
						
						
					 | 
					
						2014-11-05 02:04:12 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							0de700b566
							
						
					 | 
					
						
						
							
							* Comment out tests of hyphenation, while we decide what hyphenation policy should be.
						
						
						
						
						
					 | 
					
						2014-11-05 02:03:22 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							11915e5238
							
						
					 | 
					
						
						
							
							* Update tests
						
						
						
						
						
					 | 
					
						2014-11-03 00:23:04 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							493d5ffb50
							
						
					 | 
					
						
						
							
							* Add test for '' in punct
						
						
						
						
						
					 | 
					
						2014-11-02 21:24:09 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							99b5cefa88
							
						
					 | 
					
						
						
							
							* Add tests for emoticon tokenization
						
						
						
						
						
					 | 
					
						2014-11-02 13:22:14 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							23131f21bb
							
						
					 | 
					
						
						
							
							* Add tests for like_url
						
						
						
						
						
					 | 
					
						2014-11-02 13:21:57 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							dc6c3c0f56
							
						
					 | 
					
						
						
							
							* Add tests for like_number
						
						
						
						
						
					 | 
					
						2014-11-02 13:21:39 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							c414d0eebe
							
						
					 | 
					
						
						
							
							* Add tests for is_number
						
						
						
						
						
					 | 
					
						2014-11-01 19:13:40 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							63114820cf
							
						
					 | 
					
						
						
							
							* Upd tests for tighter interface
						
						
						
						
						
					 | 
					
						2014-10-30 18:15:30 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							13909a2e24
							
						
					 | 
					
						
						
							
							* Rewriting Lexeme serialization.
						
						
						
						
						
					 | 
					
						2014-10-29 23:19:38 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							08ce602243
							
						
					 | 
					
						
						
							
							* Large refactor, particularly to Python API
						
						
						
						
						
					 | 
					
						2014-10-24 00:59:17 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							168b2b8cb2
							
						
					 | 
					
						
						
							
							* Add tests for string intern
						
						
						
						
						
					 | 
					
						2014-10-23 20:47:06 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							077885637d
							
						
					 | 
					
						
						
							
							* Add test for reading in POS tags
						
						
						
						
						
					 | 
					
						2014-10-22 10:18:43 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							12742f4f83
							
						
					 | 
					
						
						
							
							* Add detokenize method and test
						
						
						
						
						
					 | 
					
						2014-10-18 18:07:29 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							31aad7c08a
							
						
					 | 
					
						
						
							
							* Test hyphenation etc
						
						
						
						
						
					 | 
					
						2014-10-14 20:26:16 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							99f5e59286
							
						
					 | 
					
						
						
							
							* Have tokenizer emit tokens for whitespace other than single spaces
						
						
						
						
						
					 | 
					
						2014-10-14 20:25:57 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							6fb42c4919
							
						
					 | 
					
						
						
							
							* Add offsets to Tokens class. Some changes to interfaces, and reorganization of spacy.Lang
						
						
						
						
						
					 | 
					
						2014-10-14 16:17:45 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							59b41a9fd3
							
						
					 | 
					
						
						
							
							* Switch to new data model, tests passing
						
						
						
						
						
					 | 
					
						2014-10-10 08:11:31 +11:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							bc460de171
							
						
					 | 
					
						
						
							
							* Add extra tests
						
						
						
						
						
					 | 
					
						2014-09-25 18:29:42 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							2d4e5ceafd
							
						
					 | 
					
						
						
							
							* Remove old docs stuff
						
						
						
						
						
					 | 
					
						2014-09-25 18:24:05 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							0152831c89
							
						
					 | 
					
						
						
							
							* Refactor tokenization, enable cache, and ensure we look up specials correctly even when there's confusing punctuation surrounding the token.
						
						
						
						
						
					 | 
					
						2014-09-16 18:01:46 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							db191361ee
							
						
					 | 
					
						
						
							
							* Add new tests for fancier tokenization cases
						
						
						
						
						
					 | 
					
						2014-09-15 06:31:58 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							5dcc1a426a
							
						
					 | 
					
						
						
							
							* Update tokenization tests for new tokenizer rules
						
						
						
						
						
					 | 
					
						2014-09-15 01:32:51 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							0447279c57
							
						
					 | 
					
						
						
							
							* PointerHash working, efficiency is good. 6-7 mins
						
						
						
						
						
					 | 
					
						2014-09-13 16:43:59 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							985bc68327
							
						
					 | 
					
						
						
							
							* Fix bug with trailing punct on contractions. Reduced efficiency, and slightly hacky implementation.
						
						
						
						
						
					 | 
					
						2014-09-12 18:26:26 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							b5b31c6b6e
							
						
					 | 
					
						
						
							
							* Avoid testing for object identity
						
						
						
						
						
					 | 
					
						2014-09-10 20:58:30 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							7c09c73a14
							
						
					 | 
					
						
						
							
							* Refactor to use tokens class.
						
						
						
						
						
					 | 
					
						2014-09-10 18:27:44 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							5ee4d8c641
							
						
					 | 
					
						
						
							
							* Work on tests for flag features
						
						
						
						
						
					 | 
					
						2014-09-01 23:41:43 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							bf47429368
							
						
					 | 
					
						
						
							
							* Add tests for non_sparse string transform
						
						
						
						
						
					 | 
					
						2014-09-01 23:27:31 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							c50433163f
							
						
					 | 
					
						
						
							
							* Add tests for flag features
						
						
						
						
						
					 | 
					
						2014-09-01 23:27:09 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							786a4a86fe
							
						
					 | 
					
						
						
							
							* Add tests for canon_case
						
						
						
						
						
					 | 
					
						2014-09-01 23:26:49 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							4c7b997df7
							
						
					 | 
					
						
						
							
							* Add tests for word shape features
						
						
						
						
						
					 | 
					
						2014-09-01 23:26:17 +02:00 | 
					
					
						
						
							
							
							
						
					 | 
				
			
				
					
						
							
							
								 
								Matthew Honnibal
							
						 
					 | 
					
						
						
						
						
							
						
						
							c5abb81f4c
							
						
					 | 
					
						
						
							
							* Add incomplete tests of asciify function
						
						
						
						
						
					 | 
					
						2014-09-01 23:25:51 +02:00 | 
					
					
						
						
							
							
							
						
					 |