Update spaCy pipeline

429e275 verified 5 months ago

16.3 kB

	[
	"\t",
	"\n",
	"\r",
	" ",
	" ",
	"\"",
	"'",
	"''",
	"'-(",
	"'-)",
	"'Cause",
	"'Cos",
	"'Coz",
	"'Cuz",
	"'S",
	"'X",
	"'Xxx",
	"'Xxxxx",
	"'am",
	"'bout",
	"'cause",
	"'cos",
	"'coz",
	"'cuz",
	"'d",
	"'em",
	"'ll",
	"'m",
	"'nuff",
	"'re",
	"'s",
	"'ve",
	"'x",
	"'xx",
	"'xxx",
	"'xxxx",
	"'y",
	"(",
	"(((",
	"(*>",
	"(_)",
	"(-8",
	"(-:",
	"(-;",
	"(-_-)",
	"(-d",
	"(._.)",
	"(:",
	"(;",
	"(=",
	"(>_<)",
	"(^_^)",
	"(o:",
	"(x:",
	"(x_x)",
	"(\u00ac_\u00ac)",
	"(\u0ca0_\u0ca0)",
	"(\u256f\u00b0\u25a1\u00b0\uff09\u256f\ufe35\u253b\u2501\u253b",
	")",
	")))",
	")-:",
	")/\u00af",
	"):",
	"*",
	",",
	"-",
	"-((",
	"-))",
	"-/",
	"-0",
	"-3",
	"-8",
	"-D",
	"-O",
	"-P",
	"-X",
	"-_-",
	"-__-",
	"-d",
	"-o",
	"-p",
	"-x",
	"-|",
	".",
	".C.",
	".D.",
	".E.",
	".G.",
	".H.",
	".J.",
	".M.",
	".Y.",
	"._.",
	".e.",
	".g.",
	".m.",
	".s.",
	"/",
	"/3",
	"/d",
	"/or",
	"0",
	"0.0",
	"0.o",
	"0_0",
	"0_o",
	"1",
	"10",
	"10a.m",
	"10a.m.",
	"10p.m",
	"10p.m.",
	"11",
	"11a.m",
	"11a.m.",
	"11p.m",
	"11p.m.",
	"12",
	"123456",
	"12a.m",
	"12a.m.",
	"12p.m",
	"12p.m.",
	"1a.m",
	"1a.m.",
	"1p.m",
	"1p.m.",
	"2",
	"2a.m",
	"2a.m.",
	"2p.m",
	"2p.m.",
	"3",
	"321",
	"33",
	"333",
	"3a.m",
	"3a.m.",
	"3p.m",
	"3p.m.",
	"4",
	"456",
	"4a.m",
	"4a.m.",
	"4p.m",
	"4p.m.",
	"5",
	"5a.m",
	"5a.m.",
	"5p.m",
	"5p.m.",
	"6",
	"654",
	"654321",
	"6a.m",
	"6a.m.",
	"6p.m",
	"6p.m.",
	"7",
	"7a.m",
	"7a.m.",
	"7p.m",
	"7p.m.",
	"8",
	"8)",
	"8-",
	"8-)",
	"8-D",
	"8-d",
	"8D",
	"8a.m",
	"8a.m.",
	"8d",
	"8p.m",
	"8p.m.",
	"9",
	"987654",
	"9a.m",
	"9a.m.",
	"9p.m",
	"9p.m.",
	":",
	":'(",
	":')",
	":'-(",
	":'-)",
	":(",
	":((",
	":(((",
	":()",
	":)",
	":))",
	":)))",
	":*",
	":-(",
	":-((",
	":-(((",
	":-)",
	":-))",
	":-)))",
	":-*",
	":-/",
	":-0",
	":-3",
	":->",
	":-D",
	":-O",
	":-P",
	":-X",
	":-]",
	":-d",
	":-o",
	":-p",
	":-x",
	":-|",
	":-}",
	":/",
	":0",
	":1",
	":3",
	":>",
	":D",
	":O",
	":P",
	":X",
	":]",
	":d",
	":o",
	":o)",
	":p",
	":x",
	":x)",
	":|",
	":}",
	":\u2019(",
	":\u2019)",
	":\u2019-(",
	":\u2019-)",
	";",
	";)",
	";-)",
	";-D",
	";-X",
	";-d",
	";D",
	";X",
	";_;",
	";d",
	"<",
	"<.<",
	"</3",
	"</d",
	"<3",
	"<33",
	"<333",
	"<d",
	"<dd",
	"<ddd",
	"<space>",
	"<xxxx>",
	"=",
	"=(",
	"=)",
	"=/",
	"=3",
	"=D",
	"=X",
	"=[",
	"=]",
	"=d",
	"=|",
	">",
	">.<",
	">.>",
	">:(",
	">:o",
	">:x",
	"><(((*>",
	"?",
	"@",
	"@_@",
	"A",
	"ADY",
	"AGREE",
	"ALLERGY",
	"AME",
	"ANTIBIOTIC",
	"Abreu",
	"Adm",
	"Adm.",
	"Agree",
	"Ai",
	"Ak",
	"Ak.",
	"Ala",
	"Ala.",
	"Alabama",
	"Alaska",
	"Andres",
	"Antibiotic",
	"Antibiotics",
	"Any",
	"Apr",
	"Apr.",
	"April",
	"Are",
	"Ariz",
	"Ariz.",
	"Arizona",
	"Ark",
	"Ark.",
	"Arkansas",
	"Aug",
	"Aug.",
	"August",
	"B",
	"BETA-BLOCKERS",
	"BLOOD LOSS",
	"Beta",
	"Bros",
	"Bros.",
	"Brown",
	"C",
	"C'm",
	"C++",
	"C.",
	"CDs",
	"CONSENT",
	"Ca",
	"Calif",
	"Calif.",
	"California",
	"Can",
	"Cause",
	"Co",
	"Co.",
	"Colo",
	"Colo.",
	"Colorado",
	"Conn",
	"Conn.",
	"Connecticut",
	"Corp",
	"Corp.",
	"Cos",
	"Could",
	"Coz",
	"Cuz",
	"C\u2019m",
	"D",
	"D.",
	"D.C.",
	"DURATION",
	"Dare",
	"Dec",
	"Dec.",
	"December",
	"Del",
	"Del.",
	"Delaware",
	"Did",
	"Do",
	"Does",
	"Doin",
	"Doin'",
	"Doin\u2019",
	"Dr",
	"Dr.",
	"E",
	"E.G.",
	"E.g",
	"E.g.",
	"ENT",
	"ERS",
	"Emil",
	"F",
	"F.",
	"FIRE RISK",
	"Farah",
	"Feb",
	"Feb.",
	"February",
	"Fire",
	"Fla",
	"Fla.",
	"Florida",
	"G",
	"GREETING",
	"Ga",
	"Ga.",
	"Gen",
	"Gen.",
	"Georgia",
	"Goin",
	"Goin'",
	"Goin\u2019",
	"Gon",
	"Good",
	"Got",
	"Gov",
	"Gov.",
	"Greetings",
	"H",
	"Had",
	"Has",
	"Have",
	"Havin",
	"Havin'",
	"Havin\u2019",
	"He",
	"He's",
	"Here",
	"Hey",
	"He\u2019s",
	"Hi",
	"How",
	"How's",
	"How\u2019s",
	"I",
	"I.E.",
	"I.e",
	"I.e.",
	"ING",
	"ION",
	"ISK",
	"Ia",
	"Ia.",
	"Id",
	"Id.",
	"Idaho",
	"Ill",
	"Ill.",
	"Illinois",
	"Inc",
	"Inc.",
	"Ind",
	"Ind.",
	"Indiana",
	"Iowa",
	"Is",
	"It",
	"It's",
	"It\u2019s",
	"J",
	"Jan",
	"Jan.",
	"January",
	"Johnson",
	"Jr",
	"Jr.",
	"Jul",
	"Jul.",
	"July",
	"Jun",
	"Jun.",
	"June",
	"K",
	"K.",
	"Kan",
	"Kan.",
	"Kans",
	"Kans.",
	"Kansas",
	"Kentucky",
	"Ky",
	"Ky.",
	"L",
	"La",
	"La.",
	"Let",
	"Let's",
	"Let\u2019s",
	"Lexi",
	"Louisiana",
	"Lovin",
	"Lovin'",
	"Lovin\u2019",
	"Ltd",
	"Ltd.",
	"M",
	"MEDICAL_PROCEDURE",
	"MEDICAL_ROLE",
	"MEDS/EQUIPMENT",
	"MEN",
	"MRN",
	"Ma'am",
	"Mar",
	"Mar.",
	"March",
	"Marking",
	"Mass",
	"Mass.",
	"Massachusetts",
	"May",
	"Ma\u2019am",
	"Md",
	"Md.",
	"Messrs",
	"Messrs.",
	"Mich",
	"Mich.",
	"Michigan",
	"Might",
	"Minn",
	"Minn.",
	"Minnesota",
	"Miss",
	"Miss.",
	"Mississippi",
	"Mo",
	"Mo.",
	"Mont",
	"Mont.",
	"Mount",
	"Mr",
	"Mr.",
	"Mrs",
	"Mrs.",
	"Ms",
	"Ms.",
	"Mt",
	"Mt.",
	"Must",
	"My",
	"N",
	"N.C.",
	"N.D.",
	"N.H.",
	"N.J.",
	"N.M.",
	"N.Y.",
	"NAME",
	"Neb",
	"Neb.",
	"Nebr",
	"Nebr.",
	"Nebraska",
	"Need",
	"Nev",
	"Nev.",
	"Nevada",
	"New Hampshire",
	"New Jersey",
	"New Mexico",
	"New York",
	"No",
	"North Carolina",
	"North Dakota",
	"Not",
	"Nothin",
	"Nothin'",
	"Nothin\u2019",
	"Nov",
	"Nov.",
	"November",
	"Nurse",
	"Nuthin",
	"Nuthin'",
	"Nuthin\u2019",
	"O",
	"O'clock",
	"O.O",
	"O.o",
	"OGY",
	"OLE",
	"OSS",
	"O_O",
	"O_o",
	"Oct",
	"Oct.",
	"October",
	"Okla",
	"Okla.",
	"Oklahoma",
	"Ol",
	"Ol'",
	"Ol\u2019",
	"Ore",
	"Ore.",
	"Oregon",
	"Ought",
	"O\u2019clock",
	"P",
	"POSITION",
	"Pa",
	"Pa.",
	"Patient",
	"Pennsylvania",
	"Ph",
	"Ph.D.",
	"Prof",
	"Prof.",
	"R",
	"RADIOLOGY",
	"READY",
	"REE",
	"RGY",
	"ROOT",
	"Radiology",
	"Ready",
	"Rep",
	"Rep.",
	"Rev",
	"Rev.",
	"S",
	"S.C.",
	"SCDs",
	"SITES",
	"SPECIMEN",
	"Scrub",
	"Sen",
	"Sen.",
	"Sep",
	"Sep.",
	"Sept",
	"Sept.",
	"September",
	"Sha",
	"She",
	"She's",
	"She\u2019s",
	"Should",
	"Sites",
	"Smith",
	"Somethin",
	"Somethin'",
	"Somethin\u2019",
	"South Carolina",
	"St",
	"St.",
	"T",
	"TES",
	"TIC",
	"Tech",
	"Technician",
	"Tenn",
	"Tenn.",
	"Tennessee",
	"Thank",
	"That",
	"That's",
	"That\u2019s",
	"The",
	"There",
	"There's",
	"There\u2019s",
	"These",
	"They",
	"This",
	"This's",
	"This\u2019s",
	"Those",
	"URE",
	"V",
	"V.V",
	"V_V",
	"Va",
	"Va.",
	"Virginia",
	"W",
	"Was",
	"Wash",
	"Wash.",
	"Washington",
	"We",
	"Were",
	"What",
	"What's",
	"What\u2019s",
	"When",
	"When's",
	"When\u2019s",
	"Where",
	"Where's",
	"Where\u2019s",
	"Who",
	"Who's",
	"Who\u2019s",
	"Why",
	"Why's",
	"Why\u2019s",
	"Wis",
	"Wis.",
	"Wisconsin",
	"Wo",
	"Would",
	"X'x",
	"X'xxxx",
	"X++",
	"X.",
	"X.X",
	"X.X.",
	"X.x",
	"X.x.",
	"XD",
	"XDD",
	"XX",
	"XXX",
	"XXXX",
	"XXXX XXXX",
	"XXXX-XXXX",
	"XXXX/XXXX",
	"XXXX_XXXX",
	"XXXx",
	"X_X",
	"X_x",
	"Xx",
	"Xx'",
	"Xx'x",
	"Xx'xx",
	"Xx.",
	"Xx.X.",
	"Xxx",
	"Xxx'x",
	"Xxx.",
	"Xxxx",
	"Xxxx'",
	"Xxxx'x",
	"Xxxx.",
	"Xxxxx",
	"Xxxxx'",
	"Xxxxx'x",
	"Xxxxx.",
	"Xxxxx\u2019",
	"Xxxxx\u2019x",
	"Xxxx\u2019",
	"Xxxx\u2019x",
	"Xxx\u2019x",
	"Xx\u2019",
	"Xx\u2019x",
	"Xx\u2019xx",
	"X\u2019x",
	"X\u2019xxxx",
	"Y",
	"Yes",
	"You",
	"[",
	"[-:",
	"[:",
	"[=",
	"\\",
	"\\\")",
	"\\n",
	"\\t",
	"\\x",
	"]",
	"]=",
	"^",
	"^_^",
	"^__^",
	"^___^",
	"_*)",
	"_-)",
	"_.)",
	"_<)",
	"_^)",
	"__-",
	"__^",
	"_\u00ac)",
	"_\u0ca0)",
	"a",
	"a.",
	"a.m",
	"a.m.",
	"about",
	"abreu",
	"ace",
	"add",
	"adm",
	"adm.",
	"ady",
	"aft",
	"afternoon",
	"agree",
	"ai",
	"ak",
	"ak.",
	"ala",
	"ala.",
	"all",
	"allergies",
	"allergy",
	"am",
	"ame",
	"an",
	"an.",
	"and",
	"and/or",
	"andres",
	"anesthesiologist",
	"ank",
	"ans",
	"antibiotic",
	"antibiotics",
	"any",
	"anything",
	"applied",
	"apr",
	"apr.",
	"ar.",
	"are",
	"ariz",
	"ariz.",
	"ark",
	"ark.",
	"art",
	"artery",
	"ary",
	"ash",
	"ass",
	"at",
	"aug",
	"aug.",
	"ave",
	"b",
	"b.",
	"bear",
	"because",
	"been",
	"beta",
	"beta-blockers",
	"blanket",
	"blockers",
	"blood",
	"blood loss",
	"bout",
	"br.",
	"bros",
	"bros.",
	"brown",
	"bypass",
	"c",
	"c'm",
	"c++",
	"c.",
	"ca",
	"calif",
	"calif.",
	"can",
	"cardiothoracic",
	"cause",
	"cds",
	"ce>",
	"ces",
	"ch.",
	"cholecystectomy",
	"cic",
	"co",
	"co.",
	"colo",
	"colo.",
	"come",
	"completed",
	"compression",
	"confirmed",
	"conn",
	"conn.",
	"consent",
	"cord",
	"coronary",
	"corp",
	"corp.",
	"cos",
	"could",
	"coz",
	"ct.",
	"cts",
	"cuz",
	"c\u2019m",
	"d",
	"d)",
	"d-",
	"d-)",
	"d-X",
	"d.",
	"d.c.",
	"d.d",
	"d.x",
	"dX",
	"d_d",
	"d_x",
	"dare",
	"dby",
	"dd",
	"ddd",
	"dddd",
	"ddx.x",
	"ddx.x.",
	"dec",
	"dec.",
	"decompressive",
	"del",
	"del.",
	"der",
	"devices",
	"did",
	"dm.",
	"do",
	"does",
	"doin",
	"doin'",
	"doing",
	"doin\u2019",
	"dr",
	"dr.",
	"duration",
	"dx.x",
	"dx.x.",
	"e",
	"e's",
	"e.",
	"e.g",
	"e.g.",
	"ear",
	"eb.",
	"ebr",
	"ec.",
	"ech",
	"ect",
	"eed",
	"een",
	"ein",
	"el.",
	"em",
	"emil",
	"en",
	"en.",
	"enn",
	"enough",
	"ent",
	"eon",
	"ep.",
	"ept",
	"ere",
	"ers",
	"ery",
	"ese",
	"est",
	"eta",
	"ev.",
	"eve",
	"evening",
	"everybody",
	"everyone",
	"exi",
	"expect",
	"expected",
	"e\u2019s",
	"f",
	"f.",
	"farah",
	"feb",
	"feb.",
	"fire",
	"fire risk",
	"fla",
	"fla.",
	"for",
	"four",
	"g",
	"g.",
	"ga",
	"ga.",
	"gallbladder",
	"gen",
	"gen.",
	"ght",
	"goin",
	"goin'",
	"going",
	"goin\u2019",
	"gon",
	"gonna",
	"good",
	"got",
	"gov",
	"gov.",
	"graft",
	"grafting",
	"greeting",
	"greetings",
	"h",
	"h.",
	"had",
	"has",
	"hat",
	"have",
	"havin",
	"havin'",
	"having",
	"havin\u2019",
	"he",
	"he's",
	"headrest",
	"hen",
	"here",
	"hey",
	"he\u2019s",
	"hi",
	"hin",
	"his",
	"hours",
	"how",
	"how's",
	"how\u2019s",
	"huggers",
	"i",
	"i.",
	"i.e",
	"i.e.",
	"ia",
	"ia.",
	"ial",
	"ian",
	"ich",
	"ics",
	"id",
	"id.",
	"ied",
	"ies",
	"if.",
	"ill",
	"ill.",
	"in",
	"in'",
	"inc",
	"inc.",
	"ind",
	"ind.",
	"ine",
	"ing",
	"inn",
	"introductions",
	"in\u2019",
	"ion",
	"ire",
	"is",
	"is.",
	"isk",
	"iss",
	"ist",
	"it",
	"it's",
	"ite",
	"ith",
	"it\u2019s",
	"ive",
	"iz.",
	"j",
	"j.",
	"jan",
	"jan.",
	"johnson",
	"jr",
	"jr.",
	"jul",
	"jul.",
	"jun",
	"jun.",
	"k",
	"k.",
	"kan",
	"kan.",
	"kans",
	"kans.",
	"ked",
	"ket",
	"kla",
	"ky",
	"ky.",
	"l",
	"l.",
	"la",
	"la.",
	"laminectomy",
	"laparoscopic",
	"led",
	"leg",
	"let",
	"let's",
	"let\u2019s",
	"lexi",
	"lies",
	"lif",
	"ll",
	"ll.",
	"lo.",
	"loss",
	"lovin",
	"lovin'",
	"loving",
	"lovin\u2019",
	"low",
	"ltd",
	"ltd.",
	"m",
	"m.",
	"ma'am",
	"madam",
	"mal",
	"mar",
	"mar.",
	"marked",
	"marking",
	"mass",
	"mass.",
	"may",
	"ma\u2019am",
	"md",
	"md.",
	"med",
	"medical_procedure",
	"medical_role",
	"meds/equipment",
	"men",
	"messrs",
	"messrs.",
	"mich",
	"mich.",
	"might",
	"mil",
	"minimal",
	"minn",
	"minn.",
	"miss",
	"miss.",
	"mo",
	"mo.",
	"mont",
	"mont.",
	"morning",
	"mr",
	"mr.",
	"mrn",
	"mrs",
	"mrs.",
	"ms",
	"ms.",
	"mt",
	"mt.",
	"must",
	"my",
	"n",
	"n's",
	"n't",
	"n.",
	"n.c.",
	"n.d.",
	"n.h.",
	"n.j.",
	"n.m.",
	"n.y.",
	"na",
	"nal",
	"name",
	"nc.",
	"nd.",
	"neb",
	"neb.",
	"nebr",
	"nebr.",
	"need",
	"neurosurgeon",
	"nev",
	"nev.",
	"ngs",
	"nn.",
	"no",
	"not",
	"nothin",
	"nothin'",
	"nothing",
	"nothin\u2019",
	"nov",
	"nov.",
	"ns.",
	"nt",
	"nt.",
	"nuff",
	"nurse",
	"nuthin",
	"nuthin'",
	"nuthin\u2019",
	"n\u2019s",
	"n\u2019t",
	"o",
	"o'clock",
	"o's",
	"o.",
	"o.0",
	"o.O",
	"o.o",
	"o_0",
	"o_O",
	"o_o",
	"ock",
	"oct",
	"oct.",
	"ody",
	"oes",
	"of",
	"of.",
	"ogy",
	"oin",
	"okla",
	"okla.",
	"ol",
	"ol'",
	"old",
	"olo",
	"ol\u2019",
	"omy",
	"on",
	"one",
	"onn",
	"ons",
	"ont",
	"ood",
	"oon",
	"or",
	"ord",
	"ore",
	"ore.",
	"orp",
	"ort",
	"os.",
	"ose",
	"oss",
	"ought",
	"our",
	"ous",
	"out",
	"ov.",
	"own",
	"o\u2019clock",
	"o\u2019s",
	"p",
	"p.",
	"p.m",
	"p.m.",
	"pa",
	"pa.",
	"patient",
	"ph",
	"ph.d.",
	"pic",
	"place",
	"pm",
	"position",
	"potential",
	"pr.",
	"pressure",
	"products",
	"prof",
	"prof.",
	"prone",
	"pt.",
	"q",
	"q.",
	"r",
	"r.",
	"radiology",
	"rah",
	"re",
	"re.",
	"ready",
	"red",
	"redosing",
	"ree",
	"relieve",
	"rep",
	"rep.",
	"report",
	"required",
	"requirement",
	"res",
	"resident",
	"retrieve",
	"reu",
	"rev",
	"rev.",
	"rgo",
	"risk",
	"riz",
	"rk.",
	"rof",
	"ros",
	"round",
	"rp.",
	"rs.",
	"rse",
	"rub",
	"s",
	"s's",
	"s.",
	"s.c.",
	"saphenous",
	"scds",
	"scheduled",
	"scrub",
	"sen",
	"sen.",
	"sep",
	"sep.",
	"sept",
	"sept.",
	"sh.",
	"sha",
	"shall",
	"she",
	"she's",
	"she\u2019s",
	"should",
	"site",
	"sites",
	"smith",
	"somethin",
	"somethin'",
	"something",
	"somethin\u2019",
	"son",
	"space",
	"specimen",
	"spinal",
	"srs",
	"ss.",
	"st",
	"st.",
	"standby",
	"start",
	"stockings",
	"studies",
	"supine",
	"surgeon",
	"s\u2019s",
	"t",
	"t's",
	"t.",
	"ta",
	"td.",
	"tech",
	"technician",
	"ted",
	"tenn",
	"tenn.",
	"tes",
	"thank",
	"that",
	"that's",
	"that\u2019s",
	"the",
	"them",
	"there",
	"there's",
	"there\u2019s",
	"these",
	"they",
	"this",
	"this's",
	"this\u2019s",
	"those",
	"tic",
	"timeout",
	"to",
	"two",
	"t\u2019s",
	"u",
	"u.",
	"uff",
	"ug.",
	"ul.",
	"uld",
	"un.",
	"und",
	"undergo",
	"up",
	"ure",
	"urs",
	"us",
	"use",
	"ust",
	"v",
	"v.",
	"v.s",
	"v.s.",
	"v.v",
	"v_v",
	"va",
	"va.",
	"ve",
	"vein",
	"verified",
	"vin",
	"vs",
	"vs.",
	"w",
	"w's",
	"w.",
	"w/o",
	"warming",
	"was",
	"wash",
	"wash.",
	"we",
	"were",
	"what",
	"what's",
	"what\u2019s",
	"when",
	"when's",
	"when\u2019s",
	"where",
	"where's",
	"where\u2019s",
	"who",
	"who's",
	"who\u2019s",
	"why",
	"why's",
	"why\u2019s",
	"will",
	"wis",
	"wis.",
	"with",
	"without",
	"wo",
	"would",
	"w\u2019s",
	"x",
	"x'",
	"x'x",
	"x'xxxx",
	"x.",
	"x.X",
	"x.d",
	"x.x",
	"x.x.",
	"x/x",
	"xD",
	"xDD",
	"xX",
	"xXX",
	"x_X",
	"x_d",
	"x_x",
	"xd",
	"xdd",
	"xx",
	"xx'",
	"xx'x",
	"xx'xx",
	"xx.",
	"xxx",
	"xxx'x",
	"xxx.",
	"xxx/xx",
	"xxxx",
	"xxxx'",
	"xxxx'x",
	"xxxx\u2019",
	"xxxx\u2019x",
	"xxx\u2019x",
	"xx\u2019",
	"xx\u2019x",
	"xx\u2019xx",
	"x\u2019",
	"x\u2019x",
	"x\u2019xxxx",
	"x\ufe35x",
	"y",
	"y'",
	"y's",
	"y.",
	"yes",
	"you",
	"y\u2019",
	"y\u2019s",
	"z",
	"z.",
	"|",
	"}",
	"\u00a0",
	"\u00ac",
	"\u00ac_\u00ac",
	"\u00af",
	"\u00af\\(x)/\u00af",
	"\u00af\\(\u30c4)/\u00af",
	"\u00b0",
	"\u00b0C.",
	"\u00b0F.",
	"\u00b0K.",
	"\u00b0X.",
	"\u00b0c.",
	"\u00b0f.",
	"\u00b0k.",
	"\u00b0x.",
	"\u00e4",
	"\u00e4.",
	"\u00f6",
	"\u00f6.",
	"\u00fc",
	"\u00fc.",
	"\u0ca0",
	"\u0ca0_\u0ca0",
	"\u0ca0\ufe35\u0ca0",
	"\u2014",
	"\u2018",
	"\u2018S",
	"\u2018X",
	"\u2018s",
	"\u2018x",
	"\u2019",
	"\u2019-(",
	"\u2019-)",
	"\u2019Cause",
	"\u2019Cos",
	"\u2019Coz",
	"\u2019Cuz",
	"\u2019S",
	"\u2019X",
	"\u2019Xxx",
	"\u2019Xxxxx",
	"\u2019am",
	"\u2019bout",
	"\u2019cause",
	"\u2019cos",
	"\u2019coz",
	"\u2019cuz",
	"\u2019d",
	"\u2019em",
	"\u2019ll",
	"\u2019m",
	"\u2019nuff",
	"\u2019re",
	"\u2019s",
	"\u2019ve",
	"\u2019x",
	"\u2019xx",
	"\u2019xxx",
	"\u2019xxxx",
	"\u2019y",
	"\u2019\u2019",
	"\u2501",
	"\u253b",
	"\u253b\u2501\u253b",
	"\u256f",
	"\u25a1",
	"\ufe35",
	"\uff09"
	]