Skip to content

Commit 5ca4b35

Browse files
committed
added a list of explicit organizations
1 parent 6b3082a commit 5ca4b35

File tree

4 files changed

+20
-4
lines changed

4 files changed

+20
-4
lines changed

cvscan/__init__.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -59,7 +59,7 @@ def show(self):
5959
"phone_numbers" : self.phone_numbers,
6060
"emails" : self.emails,
6161
"urls" : self.URLs,
62-
"skills" : self.skills,
62+
# "skills" : self.skills,
6363
"jobs" : self.job_positions,
6464
"job category" : self.category,
6565
"employers" : self.employers,

cvscan/data/job_positions/scraping_jobs.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -20,7 +20,7 @@
2020
job_categories = ws.__getitem__("D")
2121
for title,category in zip(job_titles[1:],job_categories[1:]):
2222
if title.value:
23-
jobs[title.value] = category.value
23+
jobs[title.value.lower()] = category.value.lower()
2424

2525
with open('positions','wb') as fp:
2626
pickle.dump(jobs,fp)
cvscan/data/organizations/explicit_organizations

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,6 @@
1+
(lp0
2+
S'Skcript'
3+
p1
4+
aS'Hasura'
5+
p2
6+
a.

cvscan/language_parser.py

Lines changed: 12 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -143,9 +143,8 @@ def fetch_employers_util(resume_text, job_positions, organizations, priority):
143143
lines_back -= 1
144144
end += 1
145145
line = temp_resume[start:end].lower()
146-
147146
for org in organizations:
148-
if org.lower() in line:
147+
if org.lower() in line and org.lower() not in job_positions:
149148
if 'present' in line:
150149
if org.lower().capitalize() in employers:
151150
employers.remove(org.lower().capitalize())
@@ -185,7 +184,18 @@ def fetch_employers(resume_text, job_positions):
185184
organizations,False)
186185
current_employers.extend(cur_emps)
187186
employers.extend(emps)
187+
188+
with open(dirpath.PKGPATH +
189+
'/data/organizations/explicit_organizations') as fp:
190+
organizations = pickle.load(fp)
188191

192+
cur_emps,emps = fetch_employers_util(resume_text, job_positions,
193+
organizations,True)
194+
current_employers.extend([emp for emp in cur_emps
195+
if emp not in current_employers])
196+
employers.extend([emp for emp in emps
197+
if emp not in employers])
198+
189199
return current_employers,employers
190200

191201

0 commit comments

Comments
 (0)