3
e_Q                 @   s(   d dl Zd dlZd dlmZ dd ZdS )    N)BeautifulSoupc           	   C   s4  t jd} g }xtdt| D ]}t| j| d j | j| d< tjd}|j	d| j| d | j| d< tjd}|j	d| j| d | j| d< tj	dd| j| d }|j
| j| d	 | j| d
 || j| d | j| d g qW t j|d	d
dddgd}|jd t jd}g }xtdt|D ]}t|j| d j |j| d< tjd}|j	d|j| d |j| d< tjd}|j	d|j| d |j| d< tj	dd|j| d }|j
|j| d |j| d |j| d
 ||j| d |j| d g q.W t j|ddd
dddgd}|jd d S )Nzjobs_des.csvr   detailsz<.*?> z/<.*?>|&([a-z0-9]+|#[0-9]{1,6}|#x[0-9a-f]{1,6});z[^a-zA-Z0-9]+ idtitlecitystate_province)columnszclean_jobs.csvzresumes_des.csvresume_details	resume_id	person_idzclean_resumes.csv)pdread_csvrangelenr   ilocZget_textrecompilesubappend	DataFrameto_csv)j_dfZ	jobs_desciprawdfr_dfZresume_desc r   I/var/www/html/talenthub/backend/ai/resume-to-job-match/clean_dataframe.pyclean_jobs_resume_csv   s8    
 
 
 <

 
 
 2r!   )pandasr   r   bs4r   r!   r   r   r   r    <module>   s   