ash256 committed on
Commit
bee14b9
·
verified ·
1 Parent(s): 886d7a7

Upload RL-trained question generation model

Browse files
README.md CHANGED
@@ -1,13 +1,13 @@
1
  ---
2
  license: apache-2.0
 
3
  base_model: Qwen/Qwen3-4B-Instruct-2507
4
  tags:
5
- - question-generation
6
- - rl
7
- - grpo
8
- - lora
9
  pipeline_tag: text-generation
10
- library_name: transformers
11
  ---
12
 
13
  # qwen3-4b-question-gen
@@ -41,4 +41,4 @@ from vllm import LLM, SamplingParams
41
  llm = LLM(model="ash256/qwen3-4b-question-gen")
42
  outputs = llm.generate(["Generate a technical screening question for a senior backend engineer:"], SamplingParams(max_tokens=256))
43
  print(outputs[0].outputs[0].text)
44
- ```
 
1
  ---
2
  license: apache-2.0
3
+ library_name: transformers
4
  base_model: Qwen/Qwen3-4B-Instruct-2507
5
  tags:
6
+ - question-generation
7
+ - rl
8
+ - grpo
9
+ - lora
10
  pipeline_tag: text-generation
 
11
  ---
12
 
13
  # qwen3-4b-question-gen
 
41
  llm = LLM(model="ash256/qwen3-4b-question-gen")
42
  outputs = llm.generate(["Generate a technical screening question for a senior backend engineer:"], SamplingParams(max_tokens=256))
43
  print(outputs[0].outputs[0].text)
44
+ ```
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:782f2b7794eb91ac319f0234bb3899c29e46d6ea74f7ca03ad1ff6821fe02607
3
  size 4967215360
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3320e2e0bc614646cef2b27cde2eea518da80f31e63e0f346ad61c7750c9bf49
3
  size 4967215360
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:40b2c71e5d756671bf45f13107512d3ff17b2cf36d5bc7522ab4714b5de2fc8e
3
  size 3077766632
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb50315a4622cc96217c77044dad2c33ead85bd281c77e4427997a991f01ce15
3
  size 3077766632