Spaces:

atquiyaoni
/

Multilabel-DataScience-Tags-Classifier

Running

Multilabel-DataScience-Tags-Classifier / app.py

Atquiya-Labiba

Updated examples

bda2ed5 6 months ago

1.96 kB

	import gradio as gr
	import onnxruntime as rt
	from transformers import AutoTokenizer
	import torch, json

	tokenizer = AutoTokenizer.from_pretrained("distilroberta-base")


	with open("tag_types_encoded.json", "r") as fp:
	encode_tag_types = json.load(fp)

	tags = list(encode_tag_types.keys())

	inf_session = rt.InferenceSession('question-classifier-quantized.onnx')
	input_name = inf_session.get_inputs()[0].name
	output_name = inf_session.get_outputs()[0].name

	def classify_question_tags(description):
	input_ids = tokenizer(description)['input_ids'][:512]
	logits = inf_session.run([output_name], {input_name: [input_ids]})[0]
	logits = torch.FloatTensor(logits)
	probs = torch.sigmoid(logits)[0]

	return dict(zip(tags, map(float, probs)))

	demo = gr.Interface(
	fn=classify_question_tags,
	inputs=gr.Textbox(lines=8, placeholder="Enter your question here..."),
	outputs=gr.Label(num_top_classes=5),
	examples = [
	"I want to develop a machine learning model that predicts the correct medicine dosage required to keep a specific lab value within the target range of 5 to 7. I also have several other predictor variables available. I am unsure which machine learning algorithm would be most suitable for deployment and use with future patients. Additionally, should I define the outcome as binary (1 if the value is between 5 and 7, and 0 otherwise), or is there a better approach?",
	"What is the best way to evaluate performance of Generative Adverserial Network (GAN)? Perhaps measuring the distance between two distributions or maybe something else?",
	"Suppose that I have a file which has thousands of skills starting from A-Z. Now, I would like to create a model that can group similar skills together (example neural network and SVM can group together). I know that I can use NLP for this problem, but I'm not sure about the algorithm that I can use to get the best result."
	],
	)
	demo.launch(inline=False)