dbleek committed on
Commit
38aee5a
·
1 Parent(s): 0d30c2b

slight tweaks to code and README

Browse files
Files changed (2) hide show
  1. README.md +1 -1
  2. milestone-3.py +3 -5
README.md CHANGED
@@ -11,7 +11,7 @@ pinned: false
11
  Project for CS-GY-6613 Spring 2023
12
 
13
  # Milestone 3
14
- USPTO Patentability Classifier:https://huggingface.co/spaces/dbleek/cs-gy-6613-project
15
 
16
  # Milestone 2
17
  Sentiment Analysis App:https://huggingface.co/spaces/dbleek/cs-gy-6613-project
 
11
  Project for CS-GY-6613 Spring 2023
12
 
13
  # Milestone 3
14
+ USPTO Patentability Classifier:https://huggingface.co/spaces/dbleek/cs-gy-6613-project-final
15
 
16
  # Milestone 2
17
  Sentiment Analysis App:https://huggingface.co/spaces/dbleek/cs-gy-6613-project
milestone-3.py CHANGED
@@ -31,7 +31,6 @@ dataset = dataset.sort("patent_number")
31
  model = torch.load("patent_classifier_v4.pt", map_location=torch.device("cpu"))
32
  tokenizer = AutoTokenizer.from_pretrained("distilbert-base-uncased")
33
  tokenizer_kwargs = {'padding':True,'truncation':True}
34
- classifier = pipeline("text-classification", model=model, tokenizer=tokenizer, **tokenizer_kwargs)
35
 
36
  def load_data():
37
  selected_application = dataset.select([applications[st.session_state.id]])
@@ -47,11 +46,10 @@ applications = {}
47
  for ds_index, example in enumerate(dataset):
48
  applications.update({example["patent_number"]: ds_index})
49
  st.selectbox(
50
- "Select a sample patent application:", applications, on_change=load_data, key="id"
51
- )
52
 
53
  # Sample title/decision displayed for additional context only, not used with model
54
- st.text_input("Sample Title", key="title", value=dataset[0]["title"])
55
  st.text_input("Sample Decision", key="decision", value=dataset[0]["decision"])
56
 
57
  # Classifier input form
@@ -72,7 +70,7 @@ if submitted:
72
  pred = torch.softmax(logits, dim=1)
73
  score = pred[0][1] # index 1 of softmax output is probability that decision = ACCEPTED
74
  st.markdown(
75
- "This application's patentability score is **{}**".format(score)
76
  )
77
 
78
 
 
31
  model = torch.load("patent_classifier_v4.pt", map_location=torch.device("cpu"))
32
  tokenizer = AutoTokenizer.from_pretrained("distilbert-base-uncased")
33
  tokenizer_kwargs = {'padding':True,'truncation':True}
 
34
 
35
  def load_data():
36
  selected_application = dataset.select([applications[st.session_state.id]])
 
46
  for ds_index, example in enumerate(dataset):
47
  applications.update({example["patent_number"]: ds_index})
48
  st.selectbox(
49
+ "Select a sample patent application:", applications, on_change=load_data, key="id")
 
50
 
51
  # Sample title/decision displayed for additional context only, not used with model
52
+ st.text_input("Sample Title", key="title", value=dataset[0]["title"],)
53
  st.text_input("Sample Decision", key="decision", value=dataset[0]["decision"])
54
 
55
  # Classifier input form
 
70
  pred = torch.softmax(logits, dim=1)
71
  score = pred[0][1] # index 1 of softmax output is probability that decision = ACCEPTED
72
  st.markdown(
73
+ "This application's patentability score is **{}**.".format(score)
74
  )
75
 
76