Spaces:

keras-io
/

ner_with_transformers

Build error

App Files Files Community

ner_with_transformers / app.py

reichenbach

Indent Correction

95eebfd over 3 years ago

raw

history blame contribute delete

2.58 kB

	import os
	os.system('pip install tensorflow')

	import json
	import numpy as np
	import gradio as gr
	import tensorflow as tf
	from tensorflow import keras
	from huggingface_hub.keras_mixin import from_pretrained_keras

	class CustomNonPaddingTokenLoss(keras.losses.Loss):
	    """Sparse categorical cross-entropy averaged over unmasked positions.

	    Positions whose label is not greater than 0 are excluded from the
	    average (presumably label 0 is the padding tag -- confirm against the
	    training data).
	    """

	    def __init__(self, name="custom_ner_loss"):
	        super().__init__(name=name)

	    def call(self, y_true, y_pred):
	        """Return the mean per-position loss over positions with label > 0.

	        Args:
	            y_true: integer class labels.
	            y_pred: unnormalised class scores (logits).

	        Returns:
	            A scalar tensor; 0 when every position is masked out.
	        """
	        # "none" is the value of keras.losses.Reduction.NONE; the string
	        # form also works on Keras versions that no longer expose the enum.
	        per_position_loss_fn = keras.losses.SparseCategoricalCrossentropy(
	            from_logits=True, reduction="none"
	        )
	        per_position_loss = per_position_loss_fn(y_true, y_pred)

	        mask = tf.cast(y_true > 0, dtype=tf.float32)
	        masked_total = tf.reduce_sum(per_position_loss * mask)

	        # divide_no_nan yields 0 instead of NaN when no position is kept.
	        return tf.math.divide_no_nan(masked_total, tf.reduce_sum(mask))

	def lowercase_and_convert_to_ids(tokens):
	    """Lower-case *tokens* and feed them to the module-level ``lookup_layer``."""
	    return lookup_layer(tf.strings.lower(tokens))

	def tokenize_and_convert_to_ids(text):
	    """Split *text* on whitespace and convert the pieces to ids.

	    The conversion itself is delegated to ``lowercase_and_convert_to_ids``.
	    """
	    return lowercase_and_convert_to_ids(text.split())


	# Filled on first use so the label mapping and the model are loaded once,
	# not on every request.
	_NER_RESOURCES = {}


	def _get_ner_resources():
	    """Return ``(mapping, model)``, loading both on the first call only."""
	    if not _NER_RESOURCES:
	        with open('mapping.json', 'r', encoding='utf-8') as f:
	            mapping = json.load(f)
	        model = from_pretrained_keras(
	            "keras-io/ner-with-transformers",
	            custom_objects={'CustomNonPaddingTokenLoss': CustomNonPaddingTokenLoss},
	            compile=False,
	        )
	        # Store both only after both loaded, so a failed load is retried.
	        _NER_RESOURCES['mapping'] = mapping
	        _NER_RESOURCES['model'] = model
	    return _NER_RESOURCES['mapping'], _NER_RESOURCES['model']


	def ner_tagging(text_1):
	    """Tag each whitespace-separated word of *text_1* with its predicted label.

	    Args:
	        text_1: the raw input text.

	    Returns:
	        A list of ``(text, label)`` tuples: one per word, each followed by a
	        ``(" ", None)`` separator. ``label`` is ``None`` for words predicted
	        as ``"O"``. Blank input yields an empty list.
	    """
	    # Same split as tokenize_and_convert_to_ids (str.split with no
	    # argument), so words and predictions line up even when the text
	    # contains repeated spaces, tabs or newlines.
	    words = text_1.split()
	    if not words:
	        return []

	    mapping, ner_model = _get_ner_resources()

	    sample_input = tokenize_and_convert_to_ids(text_1)
	    sample_input = tf.reshape(sample_input, shape=[1, -1])
	    scores = ner_model.predict(sample_input)
	    tag_ids = np.argmax(scores, axis=-1)[0]
	    tags = [mapping[str(i)] for i in tag_ids]

	    highlighted = []
	    for word, tag in zip(words, tags):
	        highlighted.append((word, tag if tag != "O" else None))
	        highlighted.append((" ", None))
	    return highlighted

	# Vocabulary lookup used by lowercase_and_convert_to_ids at request time.
	with open("vocab.json", 'r') as f:
	    vocab = json.load(f)

	lookup_layer = keras.layers.StringLookup(vocabulary=vocab['tokens'])

	# Input/output widgets. ``ner_tag`` is not referenced in the visible code.
	text_1 = gr.inputs.Textbox(lines=5)
	ner_tag = gr.outputs.Textbox()

	iface = gr.Interface(
	    fn=ner_tagging,
	    inputs=text_1,
	    outputs=['highlight'],
	    examples=[
	        ['EU rejects German call to boycott British lamb .'],
	        ["He said further scientific study was required and if it was found that action was needed it should be taken by the European Union ."],
	    ],
	    title="Named Entity Recognition with Transformers",
	    description="Named Entity Recognition with Transformers on CoNLL2003 Dataset",
	    article='Author: <a href="https://huggingface.co/reichenbach">Rishav Chandra Varma</a>',
	)

	iface.launch()