Sneha7 committed on
Commit
e4c07fc
·
verified ·
1 Parent(s): 2f7e6f8

Create policy.py

Browse files
Files changed (1) hide show
  1. policy.py +18 -0
policy.py ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import torch
2
+ from transformers import AutoModelForCausalLM, AutoTokenizer
3
+
4
def load_policy_model(model_name="microsoft/phi-2", *, lr=1e-5):
    """Load a causal-LM policy model and its tokenizer, with an optimizer attached.

    Args:
        model_name: Model identifier handed to ``from_pretrained`` for both
            the tokenizer and the model. Defaults to ``"microsoft/phi-2"``,
            the value that was previously hard-coded.
        lr: Learning rate for the Adam optimizer. Defaults to ``1e-5``,
            the value that was previously hard-coded.

    Returns:
        A ``(model, tokenizer)`` tuple. The Adam optimizer built over the
        model's parameters is stored on the model as ``model.optimizer``.
    """
    tokenizer = AutoTokenizer.from_pretrained(model_name)
    model = AutoModelForCausalLM.from_pretrained(
        model_name,
        device_map="auto",
        torch_dtype=torch.float32,
    )

    # Attach a simple optimizer so callers can reach it through the model.
    # NOTE(review): with device_map="auto" some weights may presumably be
    # placed on different devices or offloaded -- confirm that stepping the
    # optimizer works in the target environment.
    model.optimizer = torch.optim.Adam(model.parameters(), lr=lr)

    return model, tokenizer