From a486d78b06488aead982633501829138df7ff01f Mon Sep 17 00:00:00 2001 From: Gabo_Tech Date: Fri, 28 Jun 2024 21:47:48 +0200 Subject: [PATCH 01/18] Initial commit with project files --- .gitignore | 9 + LICENCE | 21 ++ README.md | 103 +++++++- config.json | 361 ++++++++++++++++++++++++- configExample.json | 41 +++ main.py | 645 ++++++++++++++++++++++++++++++++++----------- 6 files changed, 1015 insertions(+), 165 deletions(-) create mode 100644 .gitignore create mode 100644 LICENCE create mode 100644 configExample.json diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..54f2283 --- /dev/null +++ b/.gitignore @@ -0,0 +1,9 @@ +# Ignore everything +* + +# Allow specific files +!.gitignore +!main.py +!configExample.json +!README.md +!LICENCE \ No newline at end of file diff --git a/LICENCE b/LICENCE new file mode 100644 index 0000000..8df1a01 --- /dev/null +++ b/LICENCE @@ -0,0 +1,21 @@ +MIT License + +Copyright (c) 2022 dilaratznr + +Permission is hereby granted, free of charge, to any person obtaining a copy +of this software and associated documentation files (the "Software"), to deal +in the Software without restriction, including without limitation the rights +to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +copies of the Software, and to permit persons to whom the Software is +furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +SOFTWARE. \ No newline at end of file diff --git a/README.md b/README.md index 8729077..6375aae 100644 --- a/README.md +++ b/README.md @@ -1,31 +1,108 @@ # EasyApply-Linkedin -With this tool you can easily automate the process of applying for jobs on LinkedIn! +With this tool, you can easily automate the process of applying for jobs on LinkedIn! -## Getting started +## Getting Started These instructions will get you a copy of the project up and running on your local machine for development and testing purposes. ### Prerequisites 1. Install selenium. I used `pip` to install the selenium package. - -`pip install selenium` + ```sh + pip install selenium + ``` 2. Selenium requires a driver to interface with the chosen browser. Make sure the driver is in your path, you will need to add your `driver_path` to the `config.json` file. -I used the Chrome driver, you can download it [here](https://sites.google.com/a/chromium.org/chromedriver/downloads). You can also download [Edge](https://developer.microsoft.com/en-us/microsoft-edge/tools/webdriver/), [Firefox](https://github.com/mozilla/geckodriver/releases) or [Safari](https://webkit.org/blog/6900/webdriver-support-in-safari-10/). Depends on your preferred browser. + I used the Chrome driver, you can download it [here](https://sites.google.com/a/chromium.org/chromedriver/downloads). You can also download drivers for [Edge](https://developer.microsoft.com/en-us/microsoft-edge/tools/webdriver/), [Firefox](https://github.com/mozilla/geckodriver/releases), or [Safari](https://webkit.org/blog/6900/webdriver-support-in-safari-10/), depending on your preferred browser. + +### Installation + +1. Clone the repository: + ```sh + git clone https://github.com/your_username/easyapply-linkedin.git + cd easyapply-linkedin + ``` + +2. Install the necessary packages: + ```sh + pip install -r requirements.txt + ``` + +3. Update the `config.json` file with your information: + ```json + { + "email": "example@example.com", + "password": "securePassword123!", + "keywords": ["Web Developer", "JavaScript", "React"], + "locations": ["New York", "Los Angeles", "San Francisco"], + "driver_path": "/usr/local/bin/chromedriver", + "sortBy": "Alphabetical", + "filters": { + "easy_apply": true, + "experience": ["Internship", "Entry Level", "Associate", "Mid-Senior Level", "Director", "Executive"], + "jobType": ["Full-Time", "Part-Time", "Contract", "Internship", "Temporary"], + "timePostedRange": ["Any Time", "Last Month", "Past Week", "Past 24 Hours"], + "workplaceType": ["Remote", "Hybrid", "On-site"], + "less_than_10_applicants": true, + "commitments": ["Full-Time", "Part-Time", "Contract", "Temporary", "Volunteer"] + }, + "experience": [ + { + "title": "Junior Web Developer", + "description": "Developing responsive web applications using JavaScript and React.", + "date": "Jan 2023 - Present", + "company": "Example Company" + } + ], + "projects": [ + { + "title": "Project Alpha", + "desc": "A project description here...", + "link": "#", + "skills": ["JavaScript", "React", "Node.js"] + } + ], + "skills": [ + "JavaScript", + "React", + "Node.js", + "Express", + "MongoDB" + ], + "user_inputs": {} + } + ``` ### Usage -Fork and clone/download the repository and change the configuration file with: +1. Run the application: + ```sh + python main.py + ``` + +### Features + +- **Automated Job Applications**: Automatically apply to jobs that match your keywords and location. +- **Filter Options**: Customize filters for experience level, job type, time posted, workplace type, and more. +- **Logging**: Keep track of errors and the companies you've applied to. + +### Customization + +You can customize the job search and application process by editing the `config.json` file: +- **email**: Your LinkedIn email address. +- **password**: Your LinkedIn password. +- **keywords**: Keywords for finding specific job titles (e.g., "Machine Learning Engineer", "Data Scientist"). +- **locations**: Locations where you are currently looking for a position. +- **driver_path**: Path to your downloaded WebDriver. +- **sortBy**: Sort order for job listings. +- **filters**: Various filters to narrow down the job search (e.g., easy apply, experience level, job type, etc.). + +### Contributing -* Your email linked to LinkedIn. -* Your password. -* Keywords for finding specific job titles fx. Machine Learning Engineer, Data Scientist, etc. -* The location where you are currently looking for a position. -* The driver path to your downloaded webdriver. +Please feel free to comment or give suggestions/issues. Fork and submit pull requests for any enhancements or bug fixes. -Run `python main.py`. +### License -Please feel free to comment or give suggestions/issues. +This project is licensed under the MIT License - see the [LICENSE](LICENSE) file for details. diff --git a/config.json b/config.json index 0b432a4..f32f4bf 100644 --- a/config.json +++ b/config.json @@ -1,7 +1,358 @@ { - "email" : "your_email", - "password" : "your_password", - "keywords" : "your_keywords", - "location" : "your_location", - "driver_path" : "your_path_to_webdriver" + "email": "sendmessage@gabo.email", + "password": "*******,********", + "keywords": [ + "TypeScript Engineer", + "Angular Frontend", + "React Frontend", + "React Native", + "Node backend", + "JavaScript Full-Stack" + ], + "locations": [ + "Belgium", + "Netherlands", + "DACH", + "Benelux", + "United Kingdom", + "Switzerland", + "Spain", + "United States", + "European Union", + "European Economic Area", + "Germany" + ], + "driver_path": "/usr/local/bin/geckodriver", + "sortBy": "R", + "filters": { + "easy_apply": true, + "experience": [ + "Entry level", + "Associate" + ], + "jobType": [ + "Full-time", + "Contract" + ], + "timePostedRange": [ + "Past Week" + ], + "workplaceType": [ + "Remote" + ], + "less_than_10_applicants": false + }, + "experience": [ + { + "title": "Full TypeScript Stack Engineer", + "description": "As a Full-Stack TypeScript Engineer at Beyondbmi, I spearhead the development of an advanced online weight loss clinic platform. Utilizing Angular and Bootstrap for the front-end and Express with TypeORM for the back-end, I ensure consistent and reliable performance across the stack with TypeScript. My role involves implementing HIPAA-compliant encryption protocols to safeguard patient data, developing an Android application with React Native, and deploying AWS Lambda functions and AWS Cognito for secure authentication. My contributions have enhanced user experience, data security, and the platform's scalability.", + "date": "Nov 2022 - Present", + "company": "Beyondbmi" + }, + { + "title": "Software Engineer", + "description": "At GABO, I collaborate on a variety of projects, focusing on developing e-commerce sites, corporate websites, and online presences for small businesses. My work emphasizes Search Engine Optimization (SEO) to improve visibility and engagement. Using JavaScript frameworks, WordPress, PHP, and other tools, I deliver tailored, optimized web solutions. My role has honed my versatility in web development and client relationship management, ensuring long-term client satisfaction and successful project outcomes.", + "date": "Nov 2022 - Present", + "company": "GABO" + }, + { + "title": "User Interface Engineer", + "description": "During my internship at talenTeal, I led the comprehensive redesign of the company\u2019s landing page to enhance user experience (UX) and user interface (UI). My focus was on creating an intuitive and navigable website, resulting in improved accessibility and user engagement. This project demonstrated my ability to apply front-end development skills effectively to achieve significant improvements in digital interaction and user satisfaction.", + "date": "Jul 2022 - Aug 2022", + "company": "talenTeal" + }, + { + "title": "Technical Support Specialist", + "description": "At Lujo Network, I enhanced the company\u2019s security infrastructure by implementing firewalls and establishing robust backup systems. I also managed databases, developed website segments, and conducted security training sessions. My efforts improved the company\u2019s digital security framework and online presence, showcasing my ability to handle both technical support and development tasks effectively.", + "date": "Feb 2022 - Mar 2022", + "company": "Lujo Network" + }, + { + "title": "Freelancer", + "description": "I provided web solutions, applying a range of technologies to address client requirements.", + "date": "Feb 2021 - Nov 2022" + } + ], + "projects": [ + { + "title": "BEYONDBMI", + "desc": "As a Full-Stack TypeScript Engineer at Beyondbmi, I spearhead the development of an advanced online weight loss clinic platform. Utilizing Angular and Bootstrap for the front-end and Express with TypeORM for the back-end, I ensure consistent and reliable performance across the stack with TypeScript. My role involves implementing HIPAA-compliant encryption protocols to safeguard patient data, developing an Android application with React Native, and deploying AWS Lambda functions and AWS Cognito for secure authentication. My contributions have enhanced user experience, data security, and the platform's scalability.", + "link": "", + "skills": [ + "JavaScript", + "Angular", + "TypeScript", + "Bootstrap", + "React Native", + "Metro", + "AWS", + "Express", + "TypeORM", + "Postgres", + "Jest", + "CI/CD", + "Docker", + "Jira", + "Bitbucket", + "Git", + "Stripe" + ] + }, + { + "title": "GABO", + "desc": "The GABO Landing Page is a modern, visually appealing website built using the Astro framework, leveraging Solid.js for reactive UI components, Tailwind CSS for efficient styling, and Vercel for scalable hosting. This project integrates Better SQLite3 for lightweight database management, Gray Matter and Marked for markdown content handling, and Next.js with React for dynamic, interactive components. Featuring fast load times, smooth user experience, and improved SEO, the site employs Vercel Analytics and Speed Insights for monitoring performance. Key technologies include Astro, Solid.js, Tailwind CSS, Vercel, Next.js, React, Git, and GitHub.", + "link": "", + "skills": [ + "JavaScript", + "Astro", + "Solid.js", + "Tailwind CSS", + "Vercel", + "Next.js", + "React", + "TypeScript", + "Git", + "GitHub" + ] + }, + { + "title": "TALENTEAL", + "desc": "I led the comprehensive redesign of the company\u2019s landing page to enhance user experience (UX) and user interface (UI). My focus was on creating an intuitive and navigable website, resulting in improved accessibility and user engagement. This project demonstrated my ability to apply front-end development skills effectively to achieve significant improvements in digital interaction and user satisfaction.", + "link": "", + "skills": [ + "JavaScript", + "React", + "Redux", + "Django", + "UI/UX Design", + "Sass", + "Git", + "GitHub" + ] + }, + { + "title": "LUJO NETWORK", + "desc": "At Lujo Network, I led the design and development of the sign-in and sign-up pages, implementing secure forms and internationalization in several languages, along with data validation for the forms. I enhanced the company\u2019s security infrastructure by implementing firewalls and establishing robust backup systems. I also managed databases, developed website segments, and conducted security training sessions. My efforts improved the company\u2019s digital security framework and online presence, showcasing my ability to handle both technical support and development tasks effectively.", + "link": "", + "skills": [ + "JavaScript", + "HTML", + "CSS", + "Database Management", + "Cybersecurity" + ] + }, + { + "title": "EXA MONSTER", + "desc": "Exa Monster is a secure cloud storage solution that prioritizes user privacy. Developed as a SaaS application using Laravel, WordPress, and PHP, and deployed with Hetzner Cloud, it offers robust and secure storage capabilities. The platform also includes a mobile app built with React Native, providing users with seamless access to their data on the go.", + "link": "", + "skills": [ + "Laravel", + "WordPress", + "PHP", + "React Native", + "Hetzner", + "SaaS", + "Stripe" + ] + }, + { + "title": "IMALEVANTE", + "desc": "I designed and developed the Imalevante company landing page using WordPress and PHP. The project involved creating a visually appealing and functional website that effectively represents the company's brand and services.", + "link": "", + "skills": [ + "WordPress", + "PHP" + ] + }, + { + "title": "ROUTEU", + "desc": "RouteU is a fully open-sourced route management site built with the MERN stack. This project offers users the ability to manage and share routes. It is deployed on Vercel and Heroku, providing high availability and performance. The site features a modern UI developed with React, Bootstrap, and Ant Design, and it uses MongoDB Atlas for robust data management.", + "link": "https://route-u.vercel.app", + "skills": [ + "React.js", + "CSS", + "Bootstrap", + "Ant Design", + "Grommet", + "Sass", + "HTML", + "Axios", + "React Router", + "MongoDB", + "Redux", + "Express", + "Node.js" + ] + }, + { + "title": "FIGHT GAME", + "desc": "StreetFighter-like OSG (Open Sourced Game) is a simple, open-sourced fighting game inspired by Street Fighter. Developed with HTML, CSS, and Vanilla JavaScript, the game is designed for two players. It is hosted on GitHub Pages, offering easy access and a fun gaming experience.", + "link": "https://gabo-tech.github.io/StreetFighter-like-OSG", + "skills": [ + "HTML", + "CSS", + "JavaScript" + ] + }, + { + "title": "QUIZ", + "desc": "Custom Quiz is an open-sourced quiz game that uses the Open Trivia API and supports custom questions. Developed with HTML, CSS, and Vanilla JavaScript, the game offers a fun and interactive way to test knowledge on various topics. It is hosted on GitHub Pages.", + "link": "https://gabo-tech.github.io/Custom-Quizz", + "skills": [ + "HTML", + "CSS", + "JavaScript" + ] + }, + { + "title": "GABO SL", + "desc": "Gabo's Social Life is a fully open-sourced social media site built with the MERN stack. This project provides a platform for users to share and interact with content. It is deployed on Vercel and Heroku, ensuring high availability and performance. The site features modern UI components and comprehensive functionality, including user authentication, content sharing, and real-time updates.", + "link": "https://gabosl.com", + "skills": [ + "React.js", + "Sass", + "HTML", + "Axios", + "React Router", + "MongoDB", + "Redux", + "Cypress", + "Express", + "Node.js", + "Material UI", + "Swagger" + ] + }, + { + "title": "DGABO Token", + "desc": "Decentralyized GABO Token is a personal cryptocurrency project developed using JavaScript and Motoko for smart contracts. Although not deployed due to high blockchain fees, this project demonstrates the process of creating and managing a token on the Internet Computer blockchain. The project includes a web mockup and emulator setup instructions for local development.", + "link": "https://github.com/Gabo-Tech/Web3-Token-and-Faucet", + "skills": [ + "JavaScript", + "Motoko", + "HTML", + "CSS", + "React" + ] + }, + { + "title": "My Portfolio", + "desc": "This portfolio it's been designed with tailwinds and framer motion, includes several animaitons and some interactivity with background music to make the experience a bit more chilling. Has been developed with Next.js 14", + "link": "", + "skills": [ + "JavaScript", + "React", + "Next.js", + "Tailwind CSS", + "Framer Motion" + ] + }, + { + "title": "CHURCH OF JESUS CHRIST", + "desc": "This desktop application, developed using Tauri and Svelte, provides a convenient and efficient way to access and read the scriptures from the website of The Church of Jesus Christ of Latter-day Saints. The app features cross-platform compatibility (Windows, macOS, Linux), easy navigation, and a clean interface.", + "link": "https://github.com/Gabo-Tech/Scriptures-of-The-Church-of-Jesus-Christ-of-Latter-Day-Saints", + "skills": [ + "Tauri", + "Svelte", + "JavaScript", + "Node.js" + ] + } + ], + "skills": [ + "React", + "Angular", + "Svelte", + "Solid.js", + "Next.js", + "Astro", + "Tailwind CSS", + "Bootstrap", + "Ant Design", + "Material UI", + "Metro", + "React Native", + "CSS", + "HTML", + "Markdown", + "Sass", + "Grommet", + "Node.js", + "Express", + "TypeORM", + "PostgreSQL", + "Laravel", + "WordPress", + "PHP", + "Hetzner", + "Sequelize", + "Spring Boot", + "GraphQL", + "Apollo", + "JWT", + "Jest", + "Cypress", + "Playwright", + "Postman", + "Firebase", + "MongoDB", + "Redux", + "Axios", + "Swagger", + "Motoko", + "CI/CD", + "Git", + "Docker", + "Jira", + "Bitbucket", + "GitHub Actions", + "AWS", + "Vercel", + "DigitalOcean", + "Heroku", + "Netlify", + "Expo", + "Tauri", + "Recoil", + "Zustand", + "Vite", + "Vitest", + "Bun", + "MySQL", + "MariaDB", + "Mocha", + "NPM", + "Yarn", + "Webpack" + ], + "user_inputs": { + "United Kingdom": { + "City\nCity": "Valencia, Valencian Community, Spain", + "What is your gender?\nWhat is your gender?": "Male", + "Do you consider yourself to be disabled as defined by the Equality Act 2010? The Equality Act defines disability as 'A physical or mental impairment which has a substantial and long-term effect on the person's ability to carry out normal day-to-day activities'.\nDo you consider yourself to be disabled as defined by the Equality Act 2010? The Equality Act defines disability as 'A physical or mental impairment which has a substantial and long-term effect on the person's ability to carry out normal day-to-day activities'.": "No", + "Do you require any particular arrangements to support you in the recruitment and selection process?\nDo you require any particular arrangements to support you in the recruitment and selection process?\nRequired": "No", + "Please provide details of the arrangements you require. If you are invited to interview, we will confirm the arrangements with you ahead of the appointment date and time.": "No arrangements required.", + "What is your ethnic origin?\nWhat is your ethnic origin?": "White: Any other background", + "I Agree Terms & Conditions": true, + "TV Advert": false, + "CV Library": false, + "CW Jobs": false, + "Indeed": false, + "Jobsite": false, + "LinkedIn": true, + "Will you now or in the future require sponsorship for employment visa status?\nWill you now or in the future require sponsorship for employment visa status?\nRequired": "No", + "What is your current location?": "Valencia, Valencian Community, Spain", + "Have you completed the following level of education: Bachelor's Degree?\nHave you completed the following level of education: Bachelor's Degree?\nRequired": "No", + "How many years of work experience do you have with Oracle Cloud?": "0", + "How many years of work experience do you have with Oracle ERP Implementations?": "0", + "How many years of work experience do you have with Source to Pay?": "0", + "Are you legally authorized to work in United Kingdom?\nAre you legally authorized to work in United Kingdom?\nRequired": "Yes", + "Legal Name (if different than above)": "Gabriel Clemente Ramos", + "How did you hear about this job?": "LinkedIn", + "This job post is for positions in the EMEA region. Please confirm if you have the right to work in Portugal and/or UK\nThis job post is for positions in the EMEA region. Please confirm if you have the right to work in Portugal and/or UK": "Yes", + "Do you now or will you in the future require immigration sponsorship to work at Cloudflare?\nDo you now or will you in the future require immigration sponsorship to work at Cloudflare?": "No", + "Acknowledge/Confirm": true + } + } } \ No newline at end of file diff --git a/configExample.json b/configExample.json new file mode 100644 index 0000000..fd36f61 --- /dev/null +++ b/configExample.json @@ -0,0 +1,41 @@ +{ + "email": "example@example.com", + "password": "securePassword123!", + "keywords": ["Web Developer", "JavaScript", "React"], + "locations": ["New York", "Los Angeles", "San Francisco"], + "driver_path": "/usr/local/bin/chromedriver", + "sortBy": "Alphabetical", + "filters": { + "easy_apply": true, + "experience": ["Internship", "Entry Level", "Associate", "Mid-Senior Level", "Director", "Executive"], + "jobType": ["Full-Time", "Part-Time", "Contract", "Internship", "Temporary"], + "timePostedRange": ["Any Time", "Last Month", "Past Week", "Past 24 Hours"], + "workplaceType": ["Remote", "Hybrid", "On-site"], + "less_than_10_applicants": true, + "commitments": ["Full-Time", "Part-Time", "Contract", "Temporary", "Volunteer"] + }, + "experience": [ + { + "title": "Junior Web Developer", + "description": "Developing responsive web applications using JavaScript and React.", + "date": "Jan 2023 - Present", + "company": "Example Company" + } + ], + "projects": [ + { + "title": "Project Alpha", + "desc": "A project description here...", + "link": "#", + "skills": ["JavaScript", "React", "Node.js"] + } + ], + "skills": [ + "JavaScript", + "React", + "Node.js", + "Express", + "MongoDB" + ], + "user_inputs": {} + } \ No newline at end of file diff --git a/main.py b/main.py index 0232efa..99e0df4 100644 --- a/main.py +++ b/main.py @@ -1,179 +1,530 @@ +import json +import time +import urllib.parse +import logging +from datetime import datetime, timedelta +from pathlib import Path from selenium import webdriver +from selenium.webdriver.common.by import By from selenium.webdriver.common.keys import Keys from selenium.webdriver.support import expected_conditions as EC from selenium.webdriver.support.ui import WebDriverWait -from selenium.webdriver.common.by import By -from selenium.common.exceptions import NoSuchElementException, ElementClickInterceptedException, NoSuchElementException -from selenium.webdriver.common.action_chains import ActionChains -import time -import re -import json +from selenium.common.exceptions import NoSuchElementException, ElementNotInteractableException, StaleElementReferenceException, TimeoutException, ElementClickInterceptedException +from selenium.webdriver.firefox.service import Service as FirefoxService class EasyApplyLinkedin: + BASE_URL = "https://www.linkedin.com/jobs/search/" + ERROR_LOG_PATH = Path("error_log.json") + APPLIED_COMPANIES_LOG_PATH = Path("applied_companies_log.json") - def __init__(self, data): - """Parameter initialization""" + TIME_POSTED_MAPPING = { + "Any Time": "", + "Last Month": "r2592000", + "Past Week": "r604800", + "Past 24 hours": "r86400" + } + + EXPERIENCE_MAPPING = { + "Internship": "1", + "Entry level": "2", + "Associate": "3", + "Mid-Senior level": "4", + "Director": "5", + "Executive": "6" + } + + WORKPLACE_TYPE_MAPPING = { + "Remote": "2", + "Hybrid": "3", + "On-site": "1" + } + + JOB_TYPE_MAPPING = { + "Full-time": "F", + "Part-time": "P", + "Contract": "C", + "Internship": "I", + "Temporary": "T" + } + + TITLE_MAPPING = { + "Engineer": "9", + "Developer": "25201", + "Manager": "25170", + "Specialist": "1456", + "Consultant": "3731" + } + COMMITMENTS_MAPPING = { + "Full-time": "1", + "Part-time": "2", + "Contract": "3", + "Temporary": "4", + "Volunteer": "5" + } + + LOCATION_MAPPING = { + "Switzerland": "106693272", + "Spain": "105646813", + "United States": "103644278", + "United Kingdom": "101165590", + "European Union": "91000000", + "European Economic Area": "91000002", + "DACH": "91000006", + "Benelux": "91000005", + "Netherlands": "102890719", + "Belgium":"100565514", + "Germany": "101282230" + } + + def __init__(self, data): + """Initialize the EasyApplyLinkedin instance with user data.""" self.email = data['email'] self.password = data['password'] - self.keywords = data['keywords'] - self.location = data['location'] - self.driver = webdriver.Chrome(data['driver_path']) + self.keywords = ' OR '.join(data['keywords']) + self.locations = data['locations'] + self.filters = data['filters'] + self.sort_by = data['sortBy'] + self.context_data = data + self.current_location_index = 0 + if 'user_inputs' not in self.context_data: + self.context_data['user_inputs'] = {} + firefox_service = FirefoxService(executable_path=data['driver_path']) + self.driver = webdriver.Firefox(service=firefox_service) + self.init_logging() + + def init_logging(self): + """Initialize logging for error and applied companies.""" + logging.basicConfig(level=logging.ERROR) + self.error_logger = logging.getLogger("ErrorLogger") + self.applied_companies = self.load_json(self.APPLIED_COMPANIES_LOG_PATH) + + def load_json(self, path): + """Load JSON data from the specified path.""" + if path.exists(): + with path.open('r') as file: + return json.load(file) + return {} + + def save_json(self, path, data): + """Save JSON data to the specified path.""" + with path.open('w') as file: + json.dump(data, file, indent=4) + + def log_error(self, error_msg): + """Log error messages with a timestamp.""" + errors = self.load_json(self.ERROR_LOG_PATH) + errors[str(datetime.now())] = error_msg + self.save_json(self.ERROR_LOG_PATH, errors) + self.cleanup_error_log() + + def cleanup_error_log(self): + """Clean up old error logs older than 1 day.""" + errors = self.load_json(self.ERROR_LOG_PATH) + cutoff = datetime.now() - timedelta(days=1) + errors = {k: v for k, v in errors.items() if datetime.fromisoformat(k) > cutoff} + self.save_json(self.ERROR_LOG_PATH, errors) + + def log_applied_company(self, company): + """Log the company to which an application was submitted.""" + self.applied_companies[company] = str(datetime.now()) + self.save_json(self.APPLIED_COMPANIES_LOG_PATH, self.applied_companies) + self.cleanup_applied_companies_log() + + def cleanup_applied_companies_log(self): + """Clean up logs of applied companies older than 2 weeks.""" + cutoff = datetime.now() - timedelta(weeks=2) + self.applied_companies = {k: v for k, v in self.applied_companies.items() if datetime.fromisoformat(v) > cutoff} + self.save_json(self.APPLIED_COMPANIES_LOG_PATH, self.applied_companies) def login_linkedin(self): - """This function logs into your personal LinkedIn profile""" - - # go to the LinkedIn login url - self.driver.get("https://www.linkedin.com/login") - - # introduce email and password and hit enter - login_email = self.driver.find_element_by_name('session_key') - login_email.clear() - login_email.send_keys(self.email) - login_pass = self.driver.find_element_by_name('session_password') - login_pass.clear() - login_pass.send_keys(self.password) - login_pass.send_keys(Keys.RETURN) - + """Log in to LinkedIn using the provided credentials.""" + try: + self.driver.get("https://www.linkedin.com/login") + WebDriverWait(self.driver, 10).until(EC.presence_of_element_located((By.NAME, 'session_key'))) + login_email = self.driver.find_element(By.NAME, 'session_key') + login_email.clear() + login_email.send_keys(self.email) + WebDriverWait(self.driver, 10).until(EC.presence_of_element_located((By.NAME, 'session_password'))) + login_pass = self.driver.find_element(By.NAME, 'session_password') + login_pass.clear() + login_pass.send_keys(self.password) + login_pass.send_keys(Keys.RETURN) + WebDriverWait(self.driver, 30).until(EC.presence_of_element_located((By.LINK_TEXT, 'Jobs'))) + except Exception as e: + self.log_error(f"Login error: {e}") + def job_search(self): - """This function goes to the 'Jobs' section a looks for all the jobs that matches the keywords and location""" - - # go to Jobs - jobs_link = self.driver.find_element_by_link_text('Jobs') - jobs_link.click() - - # search based on keywords and location and hit enter - search_keywords = self.driver.find_element_by_css_selector(".jobs-search-box__text-input[aria-label='Search jobs']") - search_keywords.clear() - search_keywords.send_keys(self.keywords) - search_location = self.driver.find_element_by_css_selector(".jobs-search-box__text-input[aria-label='Search location']") - search_location.clear() - search_location.send_keys(self.location) - search_location.send_keys(Keys.RETURN) - - def filter(self): - """This function filters all the job results by 'Easy Apply'""" - - # select all filters, click on Easy Apply and apply the filter - all_filters_button = self.driver.find_element_by_xpath("//button[@data-control-name='all_filters']") - all_filters_button.click() - time.sleep(1) - easy_apply_button = self.driver.find_element_by_xpath("//label[@for='f_LF-f_AL']") - easy_apply_button.click() - time.sleep(1) - apply_filter_button = self.driver.find_element_by_xpath("//button[@data-control-name='all_filters_apply']") - apply_filter_button.click() + """Perform job search based on keywords and locations.""" + while self.current_location_index < len(self.locations): + try: + WebDriverWait(self.driver, 20).until(EC.presence_of_element_located((By.LINK_TEXT, 'Jobs'))) + jobs_link = self.driver.find_element(By.LINK_TEXT, 'Jobs') + jobs_link.click() + WebDriverWait(self.driver, 20).until(EC.presence_of_element_located((By.CSS_SELECTOR, "input[aria-label='Search by title, skill, or company']"))) + search_keywords = self.driver.find_element(By.CSS_SELECTOR, "input[aria-label='Search by title, skill, or company']") + search_keywords.clear() + search_keywords.send_keys(self.keywords) + WebDriverWait(self.driver, 20).until(EC.presence_of_element_located((By.CSS_SELECTOR, "input[aria-label='City, state, or zip code']"))) + search_location = self.driver.find_element(By.CSS_SELECTOR, "input[aria-label='City, state, or zip code']") + search_location.clear() + search_location.send_keys(self.locations[self.current_location_index]) + search_keywords.click() + search_keywords.send_keys(Keys.RETURN) + + if not self.check_no_results(): + break + else: + print(f"No matching jobs found in {self.locations[self.current_location_index]}.") + self.current_location_index += 1 + + except TimeoutException: + print("Timeout while trying to access the Jobs page or elements on it.") + self.current_location_index += 1 + except Exception as e: + self.log_error(f"Job search error: {e}") + self.current_location_index += 1 + + def construct_url(self): + """Construct the URL for job search with applied filters.""" + current_location = self.locations[self.current_location_index] + params = { + "keywords": self.keywords, + "origin": "JOB_SEARCH_PAGE_JOB_FILTER", + "refresh": "true", + "sortBy": self.sort_by + } + + if self.filters.get("easy_apply"): + params["f_AL"] = "true" + + if self.filters.get("experience"): + params["f_E"] = ",".join([self.EXPERIENCE_MAPPING[exp] for exp in self.filters["experience"]]) + + if self.filters.get("jobType"): + params["f_JT"] = ",".join([self.JOB_TYPE_MAPPING[jt] for jt in self.filters["jobType"]]) + + if self.filters.get("timePostedRange"): + params["f_TPR"] = ",".join([self.TIME_POSTED_MAPPING[time] for time in self.filters["timePostedRange"]]) + + if self.filters.get("workplaceType"): + params["f_WT"] = ",".join([self.WORKPLACE_TYPE_MAPPING[wt] for wt in self.filters["workplaceType"]]) + + if self.filters.get("less_than_10_applicants"): + params["f_EA"] = "true" + + if current_location in self.LOCATION_MAPPING: + params["geoId"] = self.LOCATION_MAPPING[current_location] + + query_string = urllib.parse.urlencode(params, safe=",") + url = f"{self.BASE_URL}?{query_string}" + return url + + def apply_filters_and_search(self): + """Apply filters to the job search and navigate to the search URL.""" + while self.current_location_index < len(self.locations): + search_url = self.construct_url() + self.driver.get(search_url) + + if self.check_no_results(): + print(f"No matching jobs found in {self.locations[self.current_location_index]}.") + self.current_location_index += 1 + else: + break + + def check_no_results(self): + """Check if the job search resulted in no matches.""" + try: + no_results_element = self.driver.find_element(By.CSS_SELECTOR, "div.jobs-search-no-results-banner") + return no_results_element.is_displayed() + except NoSuchElementException: + return False + + def get_response_for_label(self, label_text): + """Get user response for a given label text.""" + current_location = self.locations[self.current_location_index] + if current_location in self.context_data['user_inputs']: + location_specific_inputs = self.context_data['user_inputs'][current_location] + if label_text in location_specific_inputs: + return location_specific_inputs[label_text] + + user_input = input(f"Please provide the answer for '{label_text}': ") + if current_location not in self.context_data['user_inputs']: + self.context_data['user_inputs'][current_location] = {} + self.context_data['user_inputs'][current_location][label_text] = user_input + self.update_config_file() + return user_input + + def get_checkbox_response_for_label(self, label_text): + """Get user response for a checkbox labeled by the given text.""" + current_location = self.locations[self.current_location_index] + if current_location in self.context_data['user_inputs']: + location_specific_inputs = self.context_data['user_inputs'][current_location] + if label_text in location_specific_inputs: + return location_specific_inputs[label_text] + + while True: + user_input = input(f"Do you want to check the box for '{label_text}'? (yes/no): ").strip().lower() + if user_input in ['yes', 'no']: + response = user_input == 'yes' + if current_location not in self.context_data['user_inputs']: + self.context_data['user_inputs'][current_location] = {} + self.context_data['user_inputs'][current_location][label_text] = response + self.update_config_file() + return response + + def get_radio_response_for_label(self, label_text, options): + """Get user response for a radio button group labeled by the given text.""" + current_location = self.locations[self.current_location_index] + if current_location in self.context_data['user_inputs']: + location_specific_inputs = self.context_data['user_inputs'][current_location] + if label_text in location_specific_inputs: + return location_specific_inputs[label_text] + + while True: + print(f"Please select an option for '{label_text}':") + for i, option in enumerate(options): + print(f"{i + 1}. {option}") + user_input = input("Enter the number of your choice: ").strip() + if user_input.isdigit() and 1 <= int(user_input) <= len(options): + response = options[int(user_input) - 1] + if current_location not in self.context_data['user_inputs']: + self.context_data['user_inputs'][current_location] = {} + self.context_data['user_inputs'][current_location][label_text] = response + self.update_config_file() + return response + + def update_config_file(self): + """Update the configuration file with the latest user inputs.""" + with open('config.json', 'w') as config_file: + json.dump(self.context_data, config_file, indent=4) def find_offers(self): - """This function finds all the offers through all the pages result of the search and filter""" - - # find the total amount of results (if the results are above 24-more than one page-, we will scroll trhough all available pages) - total_results = self.driver.find_element_by_class_name("display-flex.t-12.t-black--light.t-normal") - total_results_int = int(total_results.text.split(' ',1)[0].replace(",","")) - print(total_results_int) - - time.sleep(2) - # get results for the first page - current_page = self.driver.current_url - results = self.driver.find_elements_by_class_name("occludable-update.artdeco-list__item--offset-4.artdeco-list__item.p0.ember-view") - - # for each job add, submits application if no questions asked - for result in results: - hover = ActionChains(self.driver).move_to_element(result) - hover.perform() - titles = result.find_elements_by_class_name('job-card-search__title.artdeco-entity-lockup__title.ember-view') - for title in titles: - self.submit_apply(title) - - # if there is more than one page, find the pages and apply to the results of each page - if total_results_int > 24: - time.sleep(2) + """Find and apply to job offers.""" + while self.current_location_index < len(self.locations): + self.apply_filters_and_search() - # find the last page and construct url of each page based on the total amount of pages - find_pages = self.driver.find_elements_by_class_name("artdeco-pagination__indicator.artdeco-pagination__indicator--number") - total_pages = find_pages[len(find_pages)-1].text - total_pages_int = int(re.sub(r"[^\d.]", "", total_pages)) - get_last_page = self.driver.find_element_by_xpath("//button[@aria-label='Page "+str(total_pages_int)+"']") - get_last_page.send_keys(Keys.RETURN) - time.sleep(2) - last_page = self.driver.current_url - total_jobs = int(last_page.split('start=',1)[1]) - - # go through all available pages and job offers and apply - for page_number in range(25,total_jobs+25,25): - self.driver.get(current_page+'&start='+str(page_number)) - time.sleep(2) - results_ext = self.driver.find_elements_by_class_name("occludable-update.artdeco-list__item--offset-4.artdeco-list__item.p0.ember-view") - for result_ext in results_ext: - hover_ext = ActionChains(self.driver).move_to_element(result_ext) - hover_ext.perform() - titles_ext = result_ext.find_elements_by_class_name('job-card-search__title.artdeco-entity-lockup__title.ember-view') - for title_ext in titles_ext: - self.submit_apply(title_ext) - else: - self.close_session() - - def submit_apply(self,job_add): - """This function submits the application for the job add found""" - - print('You are applying to the position of: ', job_add.text) - job_add.click() - time.sleep(2) - - # click on the easy apply button, skip if already applied to the position + while True: + try: + WebDriverWait(self.driver, 10).until( + EC.presence_of_element_located((By.CLASS_NAME, "scaffold-layout__list-container")) + ) + + job_list_container = self.driver.find_element(By.CLASS_NAME, "scaffold-layout__list-container") + job_list_items = job_list_container.find_elements(By.TAG_NAME, "li") + + for index in range(len(job_list_items)): + try: + job_list_container = self.driver.find_element(By.CLASS_NAME, "scaffold-layout__list-container") + job_list_items = job_list_container.find_elements(By.TAG_NAME, "li") + + job_item = job_list_items[index] + job_item.click() + time.sleep(2) + + WebDriverWait(self.driver, 10).until( + EC.presence_of_element_located((By.CLASS_NAME, "jobs-search__job-details--wrapper")) + ) + + if self.job_already_applied(job_item): + print('Job already applied to, moving to next job...') + continue + + company_name = self.get_company_name(job_item) + if company_name and company_name in self.applied_companies: + print(f"Already applied to a job at {company_name}, skipping...") + continue + + job_details_wrapper = self.driver.find_element(By.CLASS_NAME, "jobs-search__job-details--wrapper") + + try: + apply_button = job_details_wrapper.find_element(By.CSS_SELECTOR, "button.jobs-apply-button.artdeco-button--primary") + apply_button.click() + time.sleep(2) + + WebDriverWait(self.driver, 10).until( + EC.presence_of_element_located((By.CSS_SELECTOR, "div.jobs-easy-apply-modal")) + ) + + self.handle_easy_apply() + + if company_name: + self.log_applied_company(company_name) + + except NoSuchElementException: + print('No apply button found, continuing to next job...') + continue + + except (NoSuchElementException, ElementNotInteractableException, StaleElementReferenceException) as e: + print(f'Exception occurred: {e}, continuing to next job...') + self.log_error(f"Find offers error: {e}") + continue + + try: + pagination_container = self.driver.find_element(By.CLASS_NAME, "artdeco-pagination__pages") + next_page_button = pagination_container.find_element(By.XPATH, "//li[contains(@class, 'artdeco-pagination__indicator') and not(contains(@class, 'active selected'))]/button") + self.driver.execute_script("arguments[0].click();", next_page_button) + time.sleep(2) + except NoSuchElementException: + print("No more pages left.") + break + except TimeoutException: + print("Timeout while waiting for job list container.") + self.log_error("Timeout while waiting for job list container.") + break + + self.current_location_index += 1 + + def get_company_name(self, job_item): + """Extract the company name from a job listing.""" try: - in_apply = self.driver.find_element_by_xpath("//button[@data-control-name='jobdetails_topcard_inapply']") - in_apply.click() + company_element = job_item.find_element(By.CSS_SELECTOR, "div.artdeco-entity-lockup__subtitle span.job-card-container__primary-description") + return company_element.text.strip() except NoSuchElementException: - print('You already applied to this job, go to next...') - pass - time.sleep(1) + return None - # try to submit if submit application is available... + def job_already_applied(self, job_item): + """Check if a job has already been applied to.""" try: - submit = self.driver.find_element_by_xpath("//button[@data-control-name='submit_unify']") - submit.send_keys(Keys.RETURN) - - # ... if not available, discard application and go to next + applied_element = job_item.find_element(By.CSS_SELECTOR, "li.job-card-container__footer-item.job-card-container__footer-job-state.t-bold") + if "Applied" in applied_element.text: + return True except NoSuchElementException: - print('Not direct application, going to next...') + pass + + return False + + def handle_easy_apply(self): + """Handle the easy apply process.""" + while True: try: - discard = self.driver.find_element_by_xpath("//button[@data-test-modal-close-btn]") - discard.send_keys(Keys.RETURN) - time.sleep(1) - discard_confirm = self.driver.find_element_by_xpath("//button[@data-test-dialog-primary-btn]") - discard_confirm.send_keys(Keys.RETURN) - time.sleep(1) - except NoSuchElementException: - pass + modal_dialog = WebDriverWait(self.driver, 10).until( + EC.presence_of_element_located((By.CSS_SELECTOR, "div.artdeco-modal--layer-default.jobs-easy-apply-modal")) + ) + try: + next_button = modal_dialog.find_element(By.CSS_SELECTOR, "button[data-easy-apply-next-button]") + self.driver.execute_script("arguments[0].click();", next_button) + time.sleep(2) + except NoSuchElementException: + try: + review_button = modal_dialog.find_element(By.CSS_SELECTOR, "button[aria-label='Review your application']") + self.driver.execute_script("arguments[0].click();", review_button) + time.sleep(2) + except NoSuchElementException: + try: + submit_button = modal_dialog.find_element(By.CSS_SELECTOR, "button[aria-label='Submit application']") + self.driver.execute_script("arguments[0].click();", submit_button) + time.sleep(2) + print("Application submitted.") + self.handle_done_button() + break + except NoSuchElementException: + print('Submit button not found, continuing to next job...') + break + self.fill_form(modal_dialog) + except TimeoutException: + print('No more steps found, exiting...') + break - time.sleep(1) + def fill_form(self, modal_dialog): + """Fill out the application form.""" + form_elements = modal_dialog.find_elements(By.CSS_SELECTOR, "div[data-test-form-element]") + for element in form_elements: + try: + label = element.find_element(By.CSS_SELECTOR, "label, legend") + input_field = element.find_element(By.CSS_SELECTOR, "input, select, textarea") + label_text = label.text.strip() - def close_session(self): - """This function closes the actual session""" - - print('End of the session, see you later!') - self.driver.close() + if input_field.tag_name == "input" and input_field.get_attribute("type") == "text": + response = self.get_response_for_label(label_text) + if input_field.get_attribute("value") == "": + input_field.send_keys(response) + time.sleep(1) + input_field.send_keys(Keys.ARROW_DOWN) + input_field.send_keys(Keys.RETURN) + + elif input_field.tag_name == "select": + response = self.get_response_for_label(label_text) + select_options = input_field.find_elements(By.TAG_NAME, "option") + for option in select_options: + if option.get_attribute("value") == response: + option.click() + break - def apply(self): - """Apply to job offers""" + elif input_field.tag_name == "textarea": + response = self.get_response_for_label(label_text) + if input_field.get_attribute("value") == "": + input_field.send_keys(response) - self.driver.maximize_window() - self.login_linkedin() - time.sleep(5) - self.job_search() - time.sleep(5) - self.filter() - time.sleep(2) - self.find_offers() - time.sleep(2) - self.close_session() + elif input_field.tag_name == "input" and input_field.get_attribute("type") == "checkbox": + checkboxes = element.find_elements(By.CSS_SELECTOR, "input[type='checkbox']") + for checkbox in checkboxes: + checkbox_label = checkbox.find_element(By.XPATH, "./following-sibling::label").text.strip() + response = self.get_checkbox_response_for_label(checkbox_label) + if response is not None: + try: + if response and not checkbox.is_selected(): + self.driver.execute_script("arguments[0].click();", checkbox) + elif not response and checkbox.is_selected(): + self.driver.execute_script("arguments[0].click();", checkbox) + except ElementClickInterceptedException: + self.driver.execute_script("arguments[0].click();", checkbox) + except StaleElementReferenceException: + checkbox = element.find_element(By.XPATH, f".//input[@type='checkbox' and ./following-sibling::label[text()='{checkbox_label}']]") + if response and not checkbox.is_selected(): + self.driver.execute_script("arguments[0].click();", checkbox) + elif not response and checkbox.is_selected(): + self.driver.execute_script("arguments[0].click();", checkbox) + elif input_field.tag_name == "input" and input_field.get_attribute("type") == "radio": + radio_buttons = element.find_elements(By.CSS_SELECTOR, "input[type='radio']") + for radio in radio_buttons: + radio_label = radio.find_element(By.XPATH, "./following-sibling::label").text.strip() + response = self.get_radio_response_for_label(label_text, [rb.find_element(By.XPATH, "./following-sibling::label").text.strip() for rb in radio_buttons]) + if response.lower() == radio_label.lower(): + try: + radio.click() + except ElementClickInterceptedException: + self.driver.execute_script("arguments[0].click();", radio) + break -if __name__ == '__main__': + except NoSuchElementException: + continue + try: + next_button = modal_dialog.find_element(By.CSS_SELECTOR, "button[data-easy-apply-next-button]") + next_button.click() + time.sleep(2) + except NoSuchElementException: + print('Next button not found, form might be complete or there is an issue.') + + def handle_done_button(self): + """Handle the final done button after application submission.""" + try: + done_button = WebDriverWait(self.driver, 10).until( + EC.presence_of_element_located((By.CSS_SELECTOR, "button.artdeco-button.artdeco-button--primary")) + ) + done_button.click() + time.sleep(2) + except TimeoutException: + print("Done button not found, skipping to next job.") + + def close_session(self): + """Close the browser session.""" + print('End of the session') + self.driver.close() + self.driver.quit() + + def handle_captcha(self): + """Handle CAPTCHA prompts manually.""" + print("CAPTCHA detected. Please solve the CAPTCHA manually and then press Enter to continue...") + input() + +if __name__ == "__main__": with open('config.json') as config_file: data = json.load(config_file) - bot = EasyApplyLinkedin(data) - bot.apply() \ No newline at end of file + bot.login_linkedin() + bot.job_search() + bot.find_offers() + bot.close_session() From a37abde50c5ea4fbee4e1b64c1acd0eb9829655c Mon Sep 17 00:00:00 2001 From: Gabo_Tech Date: Fri, 28 Jun 2024 21:48:33 +0200 Subject: [PATCH 02/18] Initial commit with project files --- .gitignore | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.gitignore b/.gitignore index 54f2283..802732e 100644 --- a/.gitignore +++ b/.gitignore @@ -1,6 +1,6 @@ # Ignore everything * - +config.json # Allow specific files !.gitignore !main.py From a3b29d5aa1058885b565a681bc640c1161047bc5 Mon Sep 17 00:00:00 2001 From: Gabriel Clemente Date: Fri, 28 Jun 2024 21:50:40 +0200 Subject: [PATCH 03/18] Delete config.json --- config.json | 358 ---------------------------------------------------- 1 file changed, 358 deletions(-) delete mode 100644 config.json diff --git a/config.json b/config.json deleted file mode 100644 index f32f4bf..0000000 --- a/config.json +++ /dev/null @@ -1,358 +0,0 @@ -{ - "email": "sendmessage@gabo.email", - "password": "*******,********", - "keywords": [ - "TypeScript Engineer", - "Angular Frontend", - "React Frontend", - "React Native", - "Node backend", - "JavaScript Full-Stack" - ], - "locations": [ - "Belgium", - "Netherlands", - "DACH", - "Benelux", - "United Kingdom", - "Switzerland", - "Spain", - "United States", - "European Union", - "European Economic Area", - "Germany" - ], - "driver_path": "/usr/local/bin/geckodriver", - "sortBy": "R", - "filters": { - "easy_apply": true, - "experience": [ - "Entry level", - "Associate" - ], - "jobType": [ - "Full-time", - "Contract" - ], - "timePostedRange": [ - "Past Week" - ], - "workplaceType": [ - "Remote" - ], - "less_than_10_applicants": false - }, - "experience": [ - { - "title": "Full TypeScript Stack Engineer", - "description": "As a Full-Stack TypeScript Engineer at Beyondbmi, I spearhead the development of an advanced online weight loss clinic platform. Utilizing Angular and Bootstrap for the front-end and Express with TypeORM for the back-end, I ensure consistent and reliable performance across the stack with TypeScript. My role involves implementing HIPAA-compliant encryption protocols to safeguard patient data, developing an Android application with React Native, and deploying AWS Lambda functions and AWS Cognito for secure authentication. My contributions have enhanced user experience, data security, and the platform's scalability.", - "date": "Nov 2022 - Present", - "company": "Beyondbmi" - }, - { - "title": "Software Engineer", - "description": "At GABO, I collaborate on a variety of projects, focusing on developing e-commerce sites, corporate websites, and online presences for small businesses. My work emphasizes Search Engine Optimization (SEO) to improve visibility and engagement. Using JavaScript frameworks, WordPress, PHP, and other tools, I deliver tailored, optimized web solutions. My role has honed my versatility in web development and client relationship management, ensuring long-term client satisfaction and successful project outcomes.", - "date": "Nov 2022 - Present", - "company": "GABO" - }, - { - "title": "User Interface Engineer", - "description": "During my internship at talenTeal, I led the comprehensive redesign of the company\u2019s landing page to enhance user experience (UX) and user interface (UI). My focus was on creating an intuitive and navigable website, resulting in improved accessibility and user engagement. This project demonstrated my ability to apply front-end development skills effectively to achieve significant improvements in digital interaction and user satisfaction.", - "date": "Jul 2022 - Aug 2022", - "company": "talenTeal" - }, - { - "title": "Technical Support Specialist", - "description": "At Lujo Network, I enhanced the company\u2019s security infrastructure by implementing firewalls and establishing robust backup systems. I also managed databases, developed website segments, and conducted security training sessions. My efforts improved the company\u2019s digital security framework and online presence, showcasing my ability to handle both technical support and development tasks effectively.", - "date": "Feb 2022 - Mar 2022", - "company": "Lujo Network" - }, - { - "title": "Freelancer", - "description": "I provided web solutions, applying a range of technologies to address client requirements.", - "date": "Feb 2021 - Nov 2022" - } - ], - "projects": [ - { - "title": "BEYONDBMI", - "desc": "As a Full-Stack TypeScript Engineer at Beyondbmi, I spearhead the development of an advanced online weight loss clinic platform. Utilizing Angular and Bootstrap for the front-end and Express with TypeORM for the back-end, I ensure consistent and reliable performance across the stack with TypeScript. My role involves implementing HIPAA-compliant encryption protocols to safeguard patient data, developing an Android application with React Native, and deploying AWS Lambda functions and AWS Cognito for secure authentication. My contributions have enhanced user experience, data security, and the platform's scalability.", - "link": "", - "skills": [ - "JavaScript", - "Angular", - "TypeScript", - "Bootstrap", - "React Native", - "Metro", - "AWS", - "Express", - "TypeORM", - "Postgres", - "Jest", - "CI/CD", - "Docker", - "Jira", - "Bitbucket", - "Git", - "Stripe" - ] - }, - { - "title": "GABO", - "desc": "The GABO Landing Page is a modern, visually appealing website built using the Astro framework, leveraging Solid.js for reactive UI components, Tailwind CSS for efficient styling, and Vercel for scalable hosting. This project integrates Better SQLite3 for lightweight database management, Gray Matter and Marked for markdown content handling, and Next.js with React for dynamic, interactive components. Featuring fast load times, smooth user experience, and improved SEO, the site employs Vercel Analytics and Speed Insights for monitoring performance. Key technologies include Astro, Solid.js, Tailwind CSS, Vercel, Next.js, React, Git, and GitHub.", - "link": "", - "skills": [ - "JavaScript", - "Astro", - "Solid.js", - "Tailwind CSS", - "Vercel", - "Next.js", - "React", - "TypeScript", - "Git", - "GitHub" - ] - }, - { - "title": "TALENTEAL", - "desc": "I led the comprehensive redesign of the company\u2019s landing page to enhance user experience (UX) and user interface (UI). My focus was on creating an intuitive and navigable website, resulting in improved accessibility and user engagement. This project demonstrated my ability to apply front-end development skills effectively to achieve significant improvements in digital interaction and user satisfaction.", - "link": "", - "skills": [ - "JavaScript", - "React", - "Redux", - "Django", - "UI/UX Design", - "Sass", - "Git", - "GitHub" - ] - }, - { - "title": "LUJO NETWORK", - "desc": "At Lujo Network, I led the design and development of the sign-in and sign-up pages, implementing secure forms and internationalization in several languages, along with data validation for the forms. I enhanced the company\u2019s security infrastructure by implementing firewalls and establishing robust backup systems. I also managed databases, developed website segments, and conducted security training sessions. My efforts improved the company\u2019s digital security framework and online presence, showcasing my ability to handle both technical support and development tasks effectively.", - "link": "", - "skills": [ - "JavaScript", - "HTML", - "CSS", - "Database Management", - "Cybersecurity" - ] - }, - { - "title": "EXA MONSTER", - "desc": "Exa Monster is a secure cloud storage solution that prioritizes user privacy. Developed as a SaaS application using Laravel, WordPress, and PHP, and deployed with Hetzner Cloud, it offers robust and secure storage capabilities. The platform also includes a mobile app built with React Native, providing users with seamless access to their data on the go.", - "link": "", - "skills": [ - "Laravel", - "WordPress", - "PHP", - "React Native", - "Hetzner", - "SaaS", - "Stripe" - ] - }, - { - "title": "IMALEVANTE", - "desc": "I designed and developed the Imalevante company landing page using WordPress and PHP. The project involved creating a visually appealing and functional website that effectively represents the company's brand and services.", - "link": "", - "skills": [ - "WordPress", - "PHP" - ] - }, - { - "title": "ROUTEU", - "desc": "RouteU is a fully open-sourced route management site built with the MERN stack. This project offers users the ability to manage and share routes. It is deployed on Vercel and Heroku, providing high availability and performance. The site features a modern UI developed with React, Bootstrap, and Ant Design, and it uses MongoDB Atlas for robust data management.", - "link": "https://route-u.vercel.app", - "skills": [ - "React.js", - "CSS", - "Bootstrap", - "Ant Design", - "Grommet", - "Sass", - "HTML", - "Axios", - "React Router", - "MongoDB", - "Redux", - "Express", - "Node.js" - ] - }, - { - "title": "FIGHT GAME", - "desc": "StreetFighter-like OSG (Open Sourced Game) is a simple, open-sourced fighting game inspired by Street Fighter. Developed with HTML, CSS, and Vanilla JavaScript, the game is designed for two players. It is hosted on GitHub Pages, offering easy access and a fun gaming experience.", - "link": "https://gabo-tech.github.io/StreetFighter-like-OSG", - "skills": [ - "HTML", - "CSS", - "JavaScript" - ] - }, - { - "title": "QUIZ", - "desc": "Custom Quiz is an open-sourced quiz game that uses the Open Trivia API and supports custom questions. Developed with HTML, CSS, and Vanilla JavaScript, the game offers a fun and interactive way to test knowledge on various topics. It is hosted on GitHub Pages.", - "link": "https://gabo-tech.github.io/Custom-Quizz", - "skills": [ - "HTML", - "CSS", - "JavaScript" - ] - }, - { - "title": "GABO SL", - "desc": "Gabo's Social Life is a fully open-sourced social media site built with the MERN stack. This project provides a platform for users to share and interact with content. It is deployed on Vercel and Heroku, ensuring high availability and performance. The site features modern UI components and comprehensive functionality, including user authentication, content sharing, and real-time updates.", - "link": "https://gabosl.com", - "skills": [ - "React.js", - "Sass", - "HTML", - "Axios", - "React Router", - "MongoDB", - "Redux", - "Cypress", - "Express", - "Node.js", - "Material UI", - "Swagger" - ] - }, - { - "title": "DGABO Token", - "desc": "Decentralyized GABO Token is a personal cryptocurrency project developed using JavaScript and Motoko for smart contracts. Although not deployed due to high blockchain fees, this project demonstrates the process of creating and managing a token on the Internet Computer blockchain. The project includes a web mockup and emulator setup instructions for local development.", - "link": "https://github.com/Gabo-Tech/Web3-Token-and-Faucet", - "skills": [ - "JavaScript", - "Motoko", - "HTML", - "CSS", - "React" - ] - }, - { - "title": "My Portfolio", - "desc": "This portfolio it's been designed with tailwinds and framer motion, includes several animaitons and some interactivity with background music to make the experience a bit more chilling. Has been developed with Next.js 14", - "link": "", - "skills": [ - "JavaScript", - "React", - "Next.js", - "Tailwind CSS", - "Framer Motion" - ] - }, - { - "title": "CHURCH OF JESUS CHRIST", - "desc": "This desktop application, developed using Tauri and Svelte, provides a convenient and efficient way to access and read the scriptures from the website of The Church of Jesus Christ of Latter-day Saints. The app features cross-platform compatibility (Windows, macOS, Linux), easy navigation, and a clean interface.", - "link": "https://github.com/Gabo-Tech/Scriptures-of-The-Church-of-Jesus-Christ-of-Latter-Day-Saints", - "skills": [ - "Tauri", - "Svelte", - "JavaScript", - "Node.js" - ] - } - ], - "skills": [ - "React", - "Angular", - "Svelte", - "Solid.js", - "Next.js", - "Astro", - "Tailwind CSS", - "Bootstrap", - "Ant Design", - "Material UI", - "Metro", - "React Native", - "CSS", - "HTML", - "Markdown", - "Sass", - "Grommet", - "Node.js", - "Express", - "TypeORM", - "PostgreSQL", - "Laravel", - "WordPress", - "PHP", - "Hetzner", - "Sequelize", - "Spring Boot", - "GraphQL", - "Apollo", - "JWT", - "Jest", - "Cypress", - "Playwright", - "Postman", - "Firebase", - "MongoDB", - "Redux", - "Axios", - "Swagger", - "Motoko", - "CI/CD", - "Git", - "Docker", - "Jira", - "Bitbucket", - "GitHub Actions", - "AWS", - "Vercel", - "DigitalOcean", - "Heroku", - "Netlify", - "Expo", - "Tauri", - "Recoil", - "Zustand", - "Vite", - "Vitest", - "Bun", - "MySQL", - "MariaDB", - "Mocha", - "NPM", - "Yarn", - "Webpack" - ], - "user_inputs": { - "United Kingdom": { - "City\nCity": "Valencia, Valencian Community, Spain", - "What is your gender?\nWhat is your gender?": "Male", - "Do you consider yourself to be disabled as defined by the Equality Act 2010? The Equality Act defines disability as 'A physical or mental impairment which has a substantial and long-term effect on the person's ability to carry out normal day-to-day activities'.\nDo you consider yourself to be disabled as defined by the Equality Act 2010? The Equality Act defines disability as 'A physical or mental impairment which has a substantial and long-term effect on the person's ability to carry out normal day-to-day activities'.": "No", - "Do you require any particular arrangements to support you in the recruitment and selection process?\nDo you require any particular arrangements to support you in the recruitment and selection process?\nRequired": "No", - "Please provide details of the arrangements you require. If you are invited to interview, we will confirm the arrangements with you ahead of the appointment date and time.": "No arrangements required.", - "What is your ethnic origin?\nWhat is your ethnic origin?": "White: Any other background", - "I Agree Terms & Conditions": true, - "TV Advert": false, - "CV Library": false, - "CW Jobs": false, - "Indeed": false, - "Jobsite": false, - "LinkedIn": true, - "Will you now or in the future require sponsorship for employment visa status?\nWill you now or in the future require sponsorship for employment visa status?\nRequired": "No", - "What is your current location?": "Valencia, Valencian Community, Spain", - "Have you completed the following level of education: Bachelor's Degree?\nHave you completed the following level of education: Bachelor's Degree?\nRequired": "No", - "How many years of work experience do you have with Oracle Cloud?": "0", - "How many years of work experience do you have with Oracle ERP Implementations?": "0", - "How many years of work experience do you have with Source to Pay?": "0", - "Are you legally authorized to work in United Kingdom?\nAre you legally authorized to work in United Kingdom?\nRequired": "Yes", - "Legal Name (if different than above)": "Gabriel Clemente Ramos", - "How did you hear about this job?": "LinkedIn", - "This job post is for positions in the EMEA region. Please confirm if you have the right to work in Portugal and/or UK\nThis job post is for positions in the EMEA region. Please confirm if you have the right to work in Portugal and/or UK": "Yes", - "Do you now or will you in the future require immigration sponsorship to work at Cloudflare?\nDo you now or will you in the future require immigration sponsorship to work at Cloudflare?": "No", - "Acknowledge/Confirm": true - } - } -} \ No newline at end of file From 5f0dcee6074718ff454038d6fb8f2fbcc7d8e693 Mon Sep 17 00:00:00 2001 From: Gabriel Clemente Date: Fri, 28 Jun 2024 22:20:15 +0200 Subject: [PATCH 04/18] Update README.md --- README.md | 25 ++++++++++++++++++++++--- 1 file changed, 22 insertions(+), 3 deletions(-) diff --git a/README.md b/README.md index 6375aae..da38449 100644 --- a/README.md +++ b/README.md @@ -21,8 +21,8 @@ These instructions will get you a copy of the project up and running on your loc 1. Clone the repository: ```sh - git clone https://github.com/your_username/easyapply-linkedin.git - cd easyapply-linkedin + git clone https://github.com/Gabo-Tech/EasyApply-Linkedin.git + cd EasyApply-Linkedin ``` 2. Install the necessary packages: @@ -75,6 +75,25 @@ These instructions will get you a copy of the project up and running on your loc } ``` +4. Update the locations code in the script: + ```python + LOCATION_MAPPING = { + "Switzerland": "106693272", + "Spain": "105646813", + "United States": "103644278", + "United Kingdom": "101165590", + "European Union": "91000000", + "European Economic Area": "91000002", + "DACH": "91000006", + "Benelux": "91000005", + "Netherlands": "102890719", + "Belgium":"100565514", + "Germany": "101282230" + } + ``` + This you can find the code in the geoId found in the LinkedIn url after doing a job search. + These are the right ones if you don't want to look in other places, but there are many more. + ### Usage 1. Run the application: @@ -105,4 +124,4 @@ Please feel free to comment or give suggestions/issues. Fork and submit pull req ### License -This project is licensed under the MIT License - see the [LICENSE](LICENSE) file for details. +This project is licensed under the MIT License - see the [LICENSE](/LICENSE) file for details. From ef9d1bdb0bf89d8f5f209898c011d311653f9868 Mon Sep 17 00:00:00 2001 From: Gabriel Clemente Date: Fri, 28 Jun 2024 22:37:32 +0200 Subject: [PATCH 05/18] Create requirements.txt --- requirements.txt | 17 +++++++++++++++++ 1 file changed, 17 insertions(+) create mode 100644 requirements.txt diff --git a/requirements.txt b/requirements.txt new file mode 100644 index 0000000..53af604 --- /dev/null +++ b/requirements.txt @@ -0,0 +1,17 @@ +attrs==23.2.0 +certifi==2024.6.2 +click==8.1.7 +exceptiongroup==1.2.1 +h11==0.14.0 +idna==3.7 +outcome==1.3.0.post0 +PySocks==1.7.1 +selenium==4.22.0 +sniffio==1.3.1 +sortedcontainers==2.4.0 +trio==0.25.1 +trio-websocket==0.11.1 +typing_extensions==4.12.2 +urllib3==2.2.2 +websocket-client==1.8.0 +wsproto==1.2.0 From bce8c6739f32f38d8118679da9c4a8eea07d95bb Mon Sep 17 00:00:00 2001 From: Gabriel Clemente Date: Fri, 28 Jun 2024 22:38:04 +0200 Subject: [PATCH 06/18] Update README.md --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index da38449..cdf7e6f 100644 --- a/README.md +++ b/README.md @@ -124,4 +124,4 @@ Please feel free to comment or give suggestions/issues. Fork and submit pull req ### License -This project is licensed under the MIT License - see the [LICENSE](/LICENSE) file for details. +This project is licensed under the MIT License - see the [LICENSE](https://github.com/Gabo-Tech/EasyApply-Linkedin/blob/master/LICENCE) file for details. From 539bfa931cfe6708097a157fd4c64d80d20b78ed Mon Sep 17 00:00:00 2001 From: Gabriel Clemente Date: Fri, 28 Jun 2024 22:42:16 +0200 Subject: [PATCH 07/18] Update .gitignore --- .gitignore | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.gitignore b/.gitignore index 802732e..daadb96 100644 --- a/.gitignore +++ b/.gitignore @@ -6,4 +6,5 @@ config.json !main.py !configExample.json !README.md -!LICENCE \ No newline at end of file +!LICENCE +!requirements.txt From 89b11c658a29bcb9bb7230f53ae7462157e26f11 Mon Sep 17 00:00:00 2001 From: Gabo_Tech Date: Sun, 30 Jun 2024 02:47:35 +0200 Subject: [PATCH 08/18] added excluding filters to create more complex and specific search queries and added tests too --- .gitignore | 2 + README.md | 54 ++++++--- configExample.json | 88 ++++++++------ main.py | 296 ++++++++++++++++++++++++++++++++------------- requirements.txt | 6 + 5 files changed, 308 insertions(+), 138 deletions(-) diff --git a/.gitignore b/.gitignore index daadb96..bb768c9 100644 --- a/.gitignore +++ b/.gitignore @@ -8,3 +8,5 @@ config.json !README.md !LICENCE !requirements.txt +!e2e_tests.txt +!unit_tests.txt \ No newline at end of file diff --git a/README.md b/README.md index cdf7e6f..ca05ef7 100644 --- a/README.md +++ b/README.md @@ -15,7 +15,7 @@ These instructions will get you a copy of the project up and running on your loc 2. Selenium requires a driver to interface with the chosen browser. Make sure the driver is in your path, you will need to add your `driver_path` to the `config.json` file. - I used the Chrome driver, you can download it [here](https://sites.google.com/a/chromium.org/chromedriver/downloads). You can also download drivers for [Edge](https://developer.microsoft.com/en-us/microsoft-edge/tools/webdriver/), [Firefox](https://github.com/mozilla/geckodriver/releases), or [Safari](https://webkit.org/blog/6900/webdriver-support-in-safari-10/), depending on your preferred browser. + I used the Firefox driver, you can download it [here](https://github.com/mozilla/geckodriver/releases). You can also download drivers for [Chrome](https://sites.google.com/a/chromium.org/chromedriver/downloads), [Edge](https://developer.microsoft.com/en-us/microsoft-edge/tools/webdriver/), or [Safari](https://webkit.org/blog/6900/webdriver-support-in-safari-10/), depending on your preferred browser. ### Installation @@ -36,8 +36,9 @@ These instructions will get you a copy of the project up and running on your loc "email": "example@example.com", "password": "securePassword123!", "keywords": ["Web Developer", "JavaScript", "React"], + "keywordsToAvoid": ["C++", ".NET"], "locations": ["New York", "Los Angeles", "San Francisco"], - "driver_path": "/usr/local/bin/chromedriver", + "driver_path": "/usr/local/bin/geckodriver", "sortBy": "Alphabetical", "filters": { "easy_apply": true, @@ -77,19 +78,19 @@ These instructions will get you a copy of the project up and running on your loc 4. Update the locations code in the script: ```python - LOCATION_MAPPING = { - "Switzerland": "106693272", - "Spain": "105646813", - "United States": "103644278", - "United Kingdom": "101165590", - "European Union": "91000000", - "European Economic Area": "91000002", - "DACH": "91000006", - "Benelux": "91000005", - "Netherlands": "102890719", - "Belgium":"100565514", - "Germany": "101282230" - } + LOCATION_MAPPING = { + "Switzerland": "106693272", + "Spain": "105646813", + "United States": "103644278", + "United Kingdom": "101165590", + "European Union": "91000000", + "European Economic Area": "91000002", + "DACH": "91000006", + "Benelux": "91000005", + "Netherlands": "102890719", + "Belgium": "100565514", + "Germany": "101282230" + } ``` This you can find the code in the geoId found in the LinkedIn url after doing a job search. These are the right ones if you don't want to look in other places, but there are many more. @@ -113,15 +114,36 @@ You can customize the job search and application process by editing the `config. - **email**: Your LinkedIn email address. - **password**: Your LinkedIn password. - **keywords**: Keywords for finding specific job titles (e.g., "Machine Learning Engineer", "Data Scientist"). +- **keywordsToAvoid**: Keywords to exclude from your search. - **locations**: Locations where you are currently looking for a position. - **driver_path**: Path to your downloaded WebDriver. - **sortBy**: Sort order for job listings. - **filters**: Various filters to narrow down the job search (e.g., easy apply, experience level, job type, etc.). +### Testing + +#### Unit Tests + +Unit tests mock the Selenium WebDriver to test methods in isolation without making actual web requests. + +Run the unit tests: +```bash +python unit_tests.py +``` + +#### E2E Tests + +End-to-end tests using `pytest` and `selenium` require an actual web browser to run. + +Run the E2E tests: +```bash +pytest e2e_tests.py +``` + ### Contributing Please feel free to comment or give suggestions/issues. Fork and submit pull requests for any enhancements or bug fixes. ### License -This project is licensed under the MIT License - see the [LICENSE](https://github.com/Gabo-Tech/EasyApply-Linkedin/blob/master/LICENCE) file for details. +This project is licensed under the MIT License - see the [LICENSE](https://github.com/Gabo-Tech/EasyApply-Linkedin/blob/master/LICENCE) file for details. \ No newline at end of file diff --git a/configExample.json b/configExample.json index fd36f61..2810b50 100644 --- a/configExample.json +++ b/configExample.json @@ -1,41 +1,55 @@ { - "email": "example@example.com", - "password": "securePassword123!", - "keywords": ["Web Developer", "JavaScript", "React"], - "locations": ["New York", "Los Angeles", "San Francisco"], - "driver_path": "/usr/local/bin/chromedriver", - "sortBy": "Alphabetical", - "filters": { - "easy_apply": true, - "experience": ["Internship", "Entry Level", "Associate", "Mid-Senior Level", "Director", "Executive"], - "jobType": ["Full-Time", "Part-Time", "Contract", "Internship", "Temporary"], - "timePostedRange": ["Any Time", "Last Month", "Past Week", "Past 24 Hours"], - "workplaceType": ["Remote", "Hybrid", "On-site"], - "less_than_10_applicants": true, - "commitments": ["Full-Time", "Part-Time", "Contract", "Temporary", "Volunteer"] - }, + "email": "example@example.com", + "password": "securePassword123!", + "keywords": ["Web Developer", "JavaScript", "React"], + "keywordsToAvoid": ["C++", ".NET", "Analyst", "PHP", "Python", "C", "Java"], + "locations": ["New York", "Los Angeles", "San Francisco"], + "driver_path": "/usr/local/bin/chromedriver", + "sortBy": "Alphabetical", + "filters": { + "easy_apply": true, "experience": [ - { - "title": "Junior Web Developer", - "description": "Developing responsive web applications using JavaScript and React.", - "date": "Jan 2023 - Present", - "company": "Example Company" - } + "Internship", + "Entry Level", + "Associate", + "Mid-Senior Level", + "Director", + "Executive" ], - "projects": [ - { - "title": "Project Alpha", - "desc": "A project description here...", - "link": "#", - "skills": ["JavaScript", "React", "Node.js"] - } + "jobType": [ + "Full-Time", + "Part-Time", + "Contract", + "Internship", + "Temporary" ], - "skills": [ - "JavaScript", - "React", - "Node.js", - "Express", - "MongoDB" - ], - "user_inputs": {} - } \ No newline at end of file + "timePostedRange": ["Any Time", "Last Month", "Past Week", "Past 24 Hours"], + "workplaceType": ["Remote", "Hybrid", "On-site"], + "less_than_10_applicants": true, + "commitments": [ + "Full-Time", + "Part-Time", + "Contract", + "Temporary", + "Volunteer" + ] + }, + "experience": [ + { + "title": "Junior Web Developer", + "description": "Developing responsive web applications using JavaScript and React.", + "date": "Jan 2023 - Present", + "company": "Example Company" + } + ], + "projects": [ + { + "title": "Project Alpha", + "desc": "A project description here...", + "link": "#", + "skills": ["JavaScript", "React", "Node.js"] + } + ], + "skills": ["JavaScript", "React", "Node.js", "Express", "MongoDB"], + "user_inputs": {} +} diff --git a/main.py b/main.py index 99e0df4..aa9c644 100644 --- a/main.py +++ b/main.py @@ -9,9 +9,16 @@ from selenium.webdriver.common.keys import Keys from selenium.webdriver.support import expected_conditions as EC from selenium.webdriver.support.ui import WebDriverWait -from selenium.common.exceptions import NoSuchElementException, ElementNotInteractableException, StaleElementReferenceException, TimeoutException, ElementClickInterceptedException +from selenium.common.exceptions import ( + NoSuchElementException, + ElementNotInteractableException, + StaleElementReferenceException, + TimeoutException, + ElementClickInterceptedException, +) from selenium.webdriver.firefox.service import Service as FirefoxService + class EasyApplyLinkedin: BASE_URL = "https://www.linkedin.com/jobs/search/" ERROR_LOG_PATH = Path("error_log.json") @@ -21,7 +28,7 @@ class EasyApplyLinkedin: "Any Time": "", "Last Month": "r2592000", "Past Week": "r604800", - "Past 24 hours": "r86400" + "Past 24 hours": "r86400", } EXPERIENCE_MAPPING = { @@ -30,13 +37,13 @@ class EasyApplyLinkedin: "Associate": "3", "Mid-Senior level": "4", "Director": "5", - "Executive": "6" + "Executive": "6", } WORKPLACE_TYPE_MAPPING = { "Remote": "2", "Hybrid": "3", - "On-site": "1" + "On-site": "1", } JOB_TYPE_MAPPING = { @@ -44,7 +51,7 @@ class EasyApplyLinkedin: "Part-time": "P", "Contract": "C", "Internship": "I", - "Temporary": "T" + "Temporary": "T", } TITLE_MAPPING = { @@ -52,7 +59,7 @@ class EasyApplyLinkedin: "Developer": "25201", "Manager": "25170", "Specialist": "1456", - "Consultant": "3731" + "Consultant": "3731", } COMMITMENTS_MAPPING = { @@ -60,7 +67,7 @@ class EasyApplyLinkedin: "Part-time": "2", "Contract": "3", "Temporary": "4", - "Volunteer": "5" + "Volunteer": "5", } LOCATION_MAPPING = { @@ -73,23 +80,24 @@ class EasyApplyLinkedin: "DACH": "91000006", "Benelux": "91000005", "Netherlands": "102890719", - "Belgium":"100565514", - "Germany": "101282230" + "Belgium": "100565514", + "Germany": "101282230", } def __init__(self, data): """Initialize the EasyApplyLinkedin instance with user data.""" - self.email = data['email'] - self.password = data['password'] - self.keywords = ' OR '.join(data['keywords']) - self.locations = data['locations'] - self.filters = data['filters'] - self.sort_by = data['sortBy'] + self.email = data["email"] + self.password = data["password"] + self.keywords = " OR ".join(data["keywords"]) + self.keywords_to_avoid = " NOT ".join(data["keywordsToAvoid"]) + self.locations = data["locations"] + self.filters = data["filters"] + self.sort_by = data["sortBy"] self.context_data = data self.current_location_index = 0 - if 'user_inputs' not in self.context_data: - self.context_data['user_inputs'] = {} - firefox_service = FirefoxService(executable_path=data['driver_path']) + if "user_inputs" not in self.context_data: + self.context_data["user_inputs"] = {} + firefox_service = FirefoxService(executable_path=data["driver_path"]) self.driver = webdriver.Firefox(service=firefox_service) self.init_logging() @@ -102,13 +110,13 @@ def init_logging(self): def load_json(self, path): """Load JSON data from the specified path.""" if path.exists(): - with path.open('r') as file: + with path.open("r") as file: return json.load(file) return {} def save_json(self, path, data): """Save JSON data to the specified path.""" - with path.open('w') as file: + with path.open("w") as file: json.dump(data, file, indent=4) def log_error(self, error_msg): @@ -134,23 +142,33 @@ def log_applied_company(self, company): def cleanup_applied_companies_log(self): """Clean up logs of applied companies older than 2 weeks.""" cutoff = datetime.now() - timedelta(weeks=2) - self.applied_companies = {k: v for k, v in self.applied_companies.items() if datetime.fromisoformat(v) > cutoff} + self.applied_companies = { + k: v + for k, v in self.applied_companies.items() + if datetime.fromisoformat(v) > cutoff + } self.save_json(self.APPLIED_COMPANIES_LOG_PATH, self.applied_companies) def login_linkedin(self): """Log in to LinkedIn using the provided credentials.""" try: self.driver.get("https://www.linkedin.com/login") - WebDriverWait(self.driver, 10).until(EC.presence_of_element_located((By.NAME, 'session_key'))) - login_email = self.driver.find_element(By.NAME, 'session_key') + WebDriverWait(self.driver, 10).until( + EC.presence_of_element_located((By.NAME, "session_key")) + ) + login_email = self.driver.find_element(By.NAME, "session_key") login_email.clear() login_email.send_keys(self.email) - WebDriverWait(self.driver, 10).until(EC.presence_of_element_located((By.NAME, 'session_password'))) - login_pass = self.driver.find_element(By.NAME, 'session_password') + WebDriverWait(self.driver, 10).until( + EC.presence_of_element_located((By.NAME, "session_password")) + ) + login_pass = self.driver.find_element(By.NAME, "session_password") login_pass.clear() login_pass.send_keys(self.password) login_pass.send_keys(Keys.RETURN) - WebDriverWait(self.driver, 30).until(EC.presence_of_element_located((By.LINK_TEXT, 'Jobs'))) + WebDriverWait(self.driver, 30).until( + EC.presence_of_element_located((By.LINK_TEXT, "Jobs")) + ) except Exception as e: self.log_error(f"Login error: {e}") @@ -158,15 +176,31 @@ def job_search(self): """Perform job search based on keywords and locations.""" while self.current_location_index < len(self.locations): try: - WebDriverWait(self.driver, 20).until(EC.presence_of_element_located((By.LINK_TEXT, 'Jobs'))) - jobs_link = self.driver.find_element(By.LINK_TEXT, 'Jobs') + WebDriverWait(self.driver, 20).until( + EC.presence_of_element_located((By.LINK_TEXT, "Jobs")) + ) + jobs_link = self.driver.find_element(By.LINK_TEXT, "Jobs") jobs_link.click() - WebDriverWait(self.driver, 20).until(EC.presence_of_element_located((By.CSS_SELECTOR, "input[aria-label='Search by title, skill, or company']"))) - search_keywords = self.driver.find_element(By.CSS_SELECTOR, "input[aria-label='Search by title, skill, or company']") + WebDriverWait(self.driver, 20).until( + EC.presence_of_element_located( + (By.CSS_SELECTOR, "input[aria-label='Search by title, skill, or company']") + ) + ) + search_keywords = self.driver.find_element( + By.CSS_SELECTOR, "input[aria-label='Search by title, skill, or company']" + ) search_keywords.clear() search_keywords.send_keys(self.keywords) - WebDriverWait(self.driver, 20).until(EC.presence_of_element_located((By.CSS_SELECTOR, "input[aria-label='City, state, or zip code']"))) - search_location = self.driver.find_element(By.CSS_SELECTOR, "input[aria-label='City, state, or zip code']") + search_keywords.send_keys(" NOT ") + search_keywords.send_keys(self.keywords_to_avoid) + WebDriverWait(self.driver, 20).until( + EC.presence_of_element_located( + (By.CSS_SELECTOR, "input[aria-label='City, state, or zip code']") + ) + ) + search_location = self.driver.find_element( + By.CSS_SELECTOR, "input[aria-label='City, state, or zip code']" + ) search_location.clear() search_location.send_keys(self.locations[self.current_location_index]) search_keywords.click() @@ -175,7 +209,9 @@ def job_search(self): if not self.check_no_results(): break else: - print(f"No matching jobs found in {self.locations[self.current_location_index]}.") + print( + f"No matching jobs found in {self.locations[self.current_location_index]}." + ) self.current_location_index += 1 except TimeoutException: @@ -189,26 +225,34 @@ def construct_url(self): """Construct the URL for job search with applied filters.""" current_location = self.locations[self.current_location_index] params = { - "keywords": self.keywords, + "keywords": f"({self.keywords}) NOT ({self.keywords_to_avoid})", "origin": "JOB_SEARCH_PAGE_JOB_FILTER", "refresh": "true", - "sortBy": self.sort_by + "sortBy": self.sort_by, } if self.filters.get("easy_apply"): params["f_AL"] = "true" if self.filters.get("experience"): - params["f_E"] = ",".join([self.EXPERIENCE_MAPPING[exp] for exp in self.filters["experience"]]) + params["f_E"] = ",".join( + [self.EXPERIENCE_MAPPING[exp] for exp in self.filters["experience"]] + ) if self.filters.get("jobType"): - params["f_JT"] = ",".join([self.JOB_TYPE_MAPPING[jt] for jt in self.filters["jobType"]]) + params["f_JT"] = ",".join( + [self.JOB_TYPE_MAPPING[jt] for jt in self.filters["jobType"]] + ) if self.filters.get("timePostedRange"): - params["f_TPR"] = ",".join([self.TIME_POSTED_MAPPING[time] for time in self.filters["timePostedRange"]]) + params["f_TPR"] = ",".join( + [self.TIME_POSTED_MAPPING[time] for time in self.filters["timePostedRange"]] + ) if self.filters.get("workplaceType"): - params["f_WT"] = ",".join([self.WORKPLACE_TYPE_MAPPING[wt] for wt in self.filters["workplaceType"]]) + params["f_WT"] = ",".join( + [self.WORKPLACE_TYPE_MAPPING[wt] for wt in self.filters["workplaceType"]] + ) if self.filters.get("less_than_10_applicants"): params["f_EA"] = "true" @@ -235,7 +279,9 @@ def apply_filters_and_search(self): def check_no_results(self): """Check if the job search resulted in no matches.""" try: - no_results_element = self.driver.find_element(By.CSS_SELECTOR, "div.jobs-search-no-results-banner") + no_results_element = self.driver.find_element( + By.CSS_SELECTOR, "div.jobs-search-no-results-banner" + ) return no_results_element.is_displayed() except NoSuchElementException: return False @@ -243,41 +289,43 @@ def check_no_results(self): def get_response_for_label(self, label_text): """Get user response for a given label text.""" current_location = self.locations[self.current_location_index] - if current_location in self.context_data['user_inputs']: - location_specific_inputs = self.context_data['user_inputs'][current_location] + if current_location in self.context_data["user_inputs"]: + location_specific_inputs = self.context_data["user_inputs"][current_location] if label_text in location_specific_inputs: return location_specific_inputs[label_text] user_input = input(f"Please provide the answer for '{label_text}': ") - if current_location not in self.context_data['user_inputs']: - self.context_data['user_inputs'][current_location] = {} - self.context_data['user_inputs'][current_location][label_text] = user_input + if current_location not in self.context_data["user_inputs"]: + self.context_data["user_inputs"][current_location] = {} + self.context_data["user_inputs"][current_location][label_text] = user_input self.update_config_file() return user_input def get_checkbox_response_for_label(self, label_text): """Get user response for a checkbox labeled by the given text.""" current_location = self.locations[self.current_location_index] - if current_location in self.context_data['user_inputs']: - location_specific_inputs = self.context_data['user_inputs'][current_location] + if current_location in self.context_data["user_inputs"]: + location_specific_inputs = self.context_data["user_inputs"][current_location] if label_text in location_specific_inputs: return location_specific_inputs[label_text] while True: - user_input = input(f"Do you want to check the box for '{label_text}'? (yes/no): ").strip().lower() - if user_input in ['yes', 'no']: - response = user_input == 'yes' - if current_location not in self.context_data['user_inputs']: - self.context_data['user_inputs'][current_location] = {} - self.context_data['user_inputs'][current_location][label_text] = response + user_input = input( + f"Do you want to check the box for '{label_text}'? (yes/no): " + ).strip().lower() + if user_input in ["yes", "no"]: + response = user_input == "yes" + if current_location not in self.context_data["user_inputs"]: + self.context_data["user_inputs"][current_location] = {} + self.context_data["user_inputs"][current_location][label_text] = response self.update_config_file() return response def get_radio_response_for_label(self, label_text, options): """Get user response for a radio button group labeled by the given text.""" current_location = self.locations[self.current_location_index] - if current_location in self.context_data['user_inputs']: - location_specific_inputs = self.context_data['user_inputs'][current_location] + if current_location in self.context_data["user_inputs"]: + location_specific_inputs = self.context_data["user_inputs"][current_location] if label_text in location_specific_inputs: return location_specific_inputs[label_text] @@ -288,15 +336,15 @@ def get_radio_response_for_label(self, label_text, options): user_input = input("Enter the number of your choice: ").strip() if user_input.isdigit() and 1 <= int(user_input) <= len(options): response = options[int(user_input) - 1] - if current_location not in self.context_data['user_inputs']: - self.context_data['user_inputs'][current_location] = {} - self.context_data['user_inputs'][current_location][label_text] = response + if current_location not in self.context_data["user_inputs"]: + self.context_data["user_inputs"][current_location] = {} + self.context_data["user_inputs"][current_location][label_text] = response self.update_config_file() return response def update_config_file(self): """Update the configuration file with the latest user inputs.""" - with open('config.json', 'w') as config_file: + with open("config.json", "w") as config_file: json.dump(self.context_data, config_file, indent=4) def find_offers(self): @@ -310,40 +358,56 @@ def find_offers(self): EC.presence_of_element_located((By.CLASS_NAME, "scaffold-layout__list-container")) ) - job_list_container = self.driver.find_element(By.CLASS_NAME, "scaffold-layout__list-container") + job_list_container = self.driver.find_element( + By.CLASS_NAME, "scaffold-layout__list-container" + ) job_list_items = job_list_container.find_elements(By.TAG_NAME, "li") for index in range(len(job_list_items)): try: - job_list_container = self.driver.find_element(By.CLASS_NAME, "scaffold-layout__list-container") + job_list_container = self.driver.find_element( + By.CLASS_NAME, "scaffold-layout__list-container" + ) job_list_items = job_list_container.find_elements(By.TAG_NAME, "li") - + job_item = job_list_items[index] job_item.click() time.sleep(2) WebDriverWait(self.driver, 10).until( - EC.presence_of_element_located((By.CLASS_NAME, "jobs-search__job-details--wrapper")) + EC.presence_of_element_located( + (By.CLASS_NAME, "jobs-search__job-details--wrapper") + ) ) if self.job_already_applied(job_item): - print('Job already applied to, moving to next job...') + print("Job already applied to, moving to next job...") + self.close_application_modal() continue company_name = self.get_company_name(job_item) if company_name and company_name in self.applied_companies: - print(f"Already applied to a job at {company_name}, skipping...") + print( + f"Already applied to a job at {company_name}, skipping..." + ) + self.close_application_modal() continue - job_details_wrapper = self.driver.find_element(By.CLASS_NAME, "jobs-search__job-details--wrapper") + job_details_wrapper = self.driver.find_element( + By.CLASS_NAME, "jobs-search__job-details--wrapper" + ) try: - apply_button = job_details_wrapper.find_element(By.CSS_SELECTOR, "button.jobs-apply-button.artdeco-button--primary") + apply_button = job_details_wrapper.find_element( + By.CSS_SELECTOR, "button.jobs-apply-button.artdeco-button--primary" + ) apply_button.click() time.sleep(2) WebDriverWait(self.driver, 10).until( - EC.presence_of_element_located((By.CSS_SELECTOR, "div.jobs-easy-apply-modal")) + EC.presence_of_element_located( + (By.CSS_SELECTOR, "div.jobs-easy-apply-modal") + ) ) self.handle_easy_apply() @@ -352,17 +416,26 @@ def find_offers(self): self.log_applied_company(company_name) except NoSuchElementException: - print('No apply button found, continuing to next job...') + print("No apply button found, continuing to next job...") continue - except (NoSuchElementException, ElementNotInteractableException, StaleElementReferenceException) as e: - print(f'Exception occurred: {e}, continuing to next job...') + except ( + NoSuchElementException, + ElementNotInteractableException, + StaleElementReferenceException, + ) as e: + print(f"Exception occurred: {e}, continuing to next job...") self.log_error(f"Find offers error: {e}") continue try: - pagination_container = self.driver.find_element(By.CLASS_NAME, "artdeco-pagination__pages") - next_page_button = pagination_container.find_element(By.XPATH, "//li[contains(@class, 'artdeco-pagination__indicator') and not(contains(@class, 'active selected'))]/button") + pagination_container = self.driver.find_element( + By.CLASS_NAME, "artdeco-pagination__pages" + ) + next_page_button = pagination_container.find_element( + By.XPATH, + "//li[contains(@class, 'artdeco-pagination__indicator') and not(contains(@class, 'active selected'))]/button", + ) self.driver.execute_script("arguments[0].click();", next_page_button) time.sleep(2) except NoSuchElementException: @@ -378,7 +451,10 @@ def find_offers(self): def get_company_name(self, job_item): """Extract the company name from a job listing.""" try: - company_element = job_item.find_element(By.CSS_SELECTOR, "div.artdeco-entity-lockup__subtitle span.job-card-container__primary-description") + company_element = job_item.find_element( + By.CSS_SELECTOR, + "div.artdeco-entity-lockup__subtitle span.job-card-container__primary-description", + ) return company_element.text.strip() except NoSuchElementException: return None @@ -386,7 +462,10 @@ def get_company_name(self, job_item): def job_already_applied(self, job_item): """Check if a job has already been applied to.""" try: - applied_element = job_item.find_element(By.CSS_SELECTOR, "li.job-card-container__footer-item.job-card-container__footer-job-state.t-bold") + applied_element = job_item.find_element( + By.CSS_SELECTOR, + "li.job-card-container__footer-item.job-card-container__footer-job-state.t-bold", + ) if "Applied" in applied_element.text: return True except NoSuchElementException: @@ -399,36 +478,52 @@ def handle_easy_apply(self): while True: try: modal_dialog = WebDriverWait(self.driver, 10).until( - EC.presence_of_element_located((By.CSS_SELECTOR, "div.artdeco-modal--layer-default.jobs-easy-apply-modal")) + EC.presence_of_element_located( + (By.CSS_SELECTOR, "div.artdeco-modal--layer-default.jobs-easy-apply-modal") + ) ) try: - next_button = modal_dialog.find_element(By.CSS_SELECTOR, "button[data-easy-apply-next-button]") + next_button = modal_dialog.find_element( + By.CSS_SELECTOR, "button[data-easy-apply-next-button]" + ) self.driver.execute_script("arguments[0].click();", next_button) time.sleep(2) except NoSuchElementException: try: - review_button = modal_dialog.find_element(By.CSS_SELECTOR, "button[aria-label='Review your application']") + review_button = modal_dialog.find_element( + By.CSS_SELECTOR, "button[aria-label='Review your application']" + ) self.driver.execute_script("arguments[0].click();", review_button) time.sleep(2) except NoSuchElementException: try: - submit_button = modal_dialog.find_element(By.CSS_SELECTOR, "button[aria-label='Submit application']") + submit_button = modal_dialog.find_element( + By.CSS_SELECTOR, "button[aria-label='Submit application']" + ) self.driver.execute_script("arguments[0].click();", submit_button) time.sleep(2) print("Application submitted.") self.handle_done_button() break except NoSuchElementException: - print('Submit button not found, continuing to next job...') + print("Submit button not found, continuing to next job...") + self.close_application_modal() break self.fill_form(modal_dialog) except TimeoutException: - print('No more steps found, exiting...') + print("No more steps found, exiting...") + break + except Exception as e: + print(f"Error during easy apply: {e}, skipping to next job...") + self.log_error(f"Easy apply error: {e}") + self.close_application_modal() break def fill_form(self, modal_dialog): """Fill out the application form.""" - form_elements = modal_dialog.find_elements(By.CSS_SELECTOR, "div[data-test-form-element]") + form_elements = modal_dialog.find_elements( + By.CSS_SELECTOR, "div[data-test-form-element], fieldset[data-test-form-builder-radio-button-form-component], fieldset[data-test-checkbox-form-component]" + ) for element in form_elements: try: label = element.find_element(By.CSS_SELECTOR, "label, legend") @@ -496,7 +591,7 @@ def fill_form(self, modal_dialog): next_button.click() time.sleep(2) except NoSuchElementException: - print('Next button not found, form might be complete or there is an issue.') + print("Next button not found, form might be complete or there is an issue.") def handle_done_button(self): """Handle the final done button after application submission.""" @@ -509,9 +604,39 @@ def handle_done_button(self): except TimeoutException: print("Done button not found, skipping to next job.") + def close_application_modal(self): + """Close the application modal.""" + try: + close_button = WebDriverWait(self.driver, 10).until( + EC.presence_of_element_located( + ( + By.CSS_SELECTOR, + "button.artdeco-button.artdeco-button--circle.artdeco-button--muted.artdeco-button--2.artdeco-button--tertiary.artdeco-modal__dismiss", + ) + ) + ) + close_button.click() + time.sleep(2) + self.handle_discard_dialog() + except TimeoutException: + print("Close button not found, skipping to next job.") + + def handle_discard_dialog(self): + """Handle the discard dialog when closing the application modal.""" + try: + discard_button = WebDriverWait(self.driver, 10).until( + EC.presence_of_element_located( + (By.CSS_SELECTOR, "button[data-control-name='discard_application_confirm_btn']") + ) + ) + discard_button.click() + time.sleep(2) + except TimeoutException: + print("Discard button not found, skipping to next job.") + def close_session(self): """Close the browser session.""" - print('End of the session') + print("End of the session") self.driver.close() self.driver.quit() @@ -520,8 +645,9 @@ def handle_captcha(self): print("CAPTCHA detected. Please solve the CAPTCHA manually and then press Enter to continue...") input() + if __name__ == "__main__": - with open('config.json') as config_file: + with open("config.json") as config_file: data = json.load(config_file) bot = EasyApplyLinkedin(data) bot.login_linkedin() diff --git a/requirements.txt b/requirements.txt index 53af604..4ebcdf2 100644 --- a/requirements.txt +++ b/requirements.txt @@ -15,3 +15,9 @@ typing_extensions==4.12.2 urllib3==2.2.2 websocket-client==1.8.0 wsproto==1.2.0 +iniconfig==1.1.1 +packaging==21.0 +pluggy==0.13.1 +py==1.10.0 +pyparsing==2.4.7 +pytest==6.2.4 From e61c848bc9de04bb3872bf0a8cff5a3b1ed8206f Mon Sep 17 00:00:00 2001 From: Gabo_Tech Date: Sun, 30 Jun 2024 02:48:24 +0200 Subject: [PATCH 09/18] added excluding filters to create more complex and specific search queries and added tests too --- .gitignore | 4 ++-- e2e_tests.py | 52 ++++++++++++++++++++++++++++++++++++++++++++++++ unit_tests.py | 55 +++++++++++++++++++++++++++++++++++++++++++++++++++ 3 files changed, 109 insertions(+), 2 deletions(-) create mode 100644 e2e_tests.py create mode 100644 unit_tests.py diff --git a/.gitignore b/.gitignore index bb768c9..08a27fb 100644 --- a/.gitignore +++ b/.gitignore @@ -8,5 +8,5 @@ config.json !README.md !LICENCE !requirements.txt -!e2e_tests.txt -!unit_tests.txt \ No newline at end of file +!e2e_tests.py +!unit_tests.py \ No newline at end of file diff --git a/e2e_tests.py b/e2e_tests.py new file mode 100644 index 0000000..67293a0 --- /dev/null +++ b/e2e_tests.py @@ -0,0 +1,52 @@ +import pytest +from selenium import webdriver +from selenium.webdriver.firefox.service import Service as FirefoxService +from easy_apply_linkedin import EasyApplyLinkedin + +@pytest.fixture +def setup_browser(): + service = FirefoxService(executable_path="/usr/local/bin/geckodriver") + driver = webdriver.Firefox(service=service) + yield driver + driver.quit() + +@pytest.fixture +def setup_bot(setup_browser): + data = { + "email": "sendmessage@gabo.email", + "password": "bp8v9fvk#?QaKe7", + "keywords": ["TypeScript", "Angular", "React"], + "keywordsToAvoid": ["C++", ".NET"], + "locations": ["Switzerland", "Belgium"], + "driver_path": "/usr/local/bin/geckodriver", + "sortBy": "R", + "filters": { + "easy_apply": True, + "experience": [], + "jobType": ["Full-time", "Contract"], + "timePostedRange": [], + "workplaceType": ["Remote", "Hybrid"], + "less_than_10_applicants": False + } + } + bot = EasyApplyLinkedin(data) + bot.driver = setup_browser + return bot + +def test_login_linkedin(setup_bot): + setup_bot.login_linkedin() + assert "feed" in setup_bot.driver.current_url + +def test_job_search(setup_bot): + setup_bot.login_linkedin() + setup_bot.job_search() + assert "jobs/search" in setup_bot.driver.current_url + +def test_find_offers(setup_bot): + setup_bot.login_linkedin() + setup_bot.job_search() + setup_bot.find_offers() + assert len(setup_bot.applied_companies) > 0 + +if __name__ == "__main__": + pytest.main() diff --git a/unit_tests.py b/unit_tests.py new file mode 100644 index 0000000..0401d34 --- /dev/null +++ b/unit_tests.py @@ -0,0 +1,55 @@ +import unittest +from unittest.mock import patch, MagicMock +from easy_apply_linkedin import EasyApplyLinkedin + +class TestEasyApplyLinkedin(unittest.TestCase): + def setUp(self): + self.data = { + "email": "sendmessage@gabo.email", + "password": "bp8v9fvk#?QaKe7", + "keywords": ["TypeScript", "Angular", "React"], + "keywordsToAvoid": ["C++", ".NET"], + "locations": ["Switzerland", "Belgium"], + "driver_path": "/usr/local/bin/geckodriver", + "sortBy": "R", + "filters": { + "easy_apply": True, + "experience": [], + "jobType": ["Full-time", "Contract"], + "timePostedRange": [], + "workplaceType": ["Remote", "Hybrid"], + "less_than_10_applicants": False + } + } + self.bot = EasyApplyLinkedin(self.data) + + @patch('easy_apply_linkedin.webdriver.Firefox') + def test_login_linkedin(self, MockWebDriver): + mock_driver = MockWebDriver.return_value + mock_driver.find_element.return_value = MagicMock() + self.bot.login_linkedin() + mock_driver.get.assert_called_with("https://www.linkedin.com/login") + self.assertTrue(mock_driver.find_element.called) + + @patch('easy_apply_linkedin.webdriver.Firefox') + def test_construct_url(self, MockWebDriver): + url = self.bot.construct_url() + self.assertIn("keywords=TypeScript%20OR%20Angular%20OR%20React", url) + self.assertIn("geoId=106693272", url) + self.assertIn("f_AL=true", url) + + @patch('easy_apply_linkedin.webdriver.Firefox') + def test_apply_filters_and_search_no_results(self, MockWebDriver): + mock_driver = MockWebDriver.return_value + mock_driver.find_element.side_effect = NoSuchElementException + self.bot.apply_filters_and_search() + self.assertEqual(self.bot.current_location_index, 1) + + @patch('easy_apply_linkedin.webdriver.Firefox') + def test_log_error(self, MockWebDriver): + self.bot.log_error("Test error") + errors = self.bot.load_json(self.bot.ERROR_LOG_PATH) + self.assertTrue(any("Test error" in v for v in errors.values())) + +if __name__ == "__main__": + unittest.main() From 8ebd677455c21f459a1c8556763a54cb62aca2f3 Mon Sep 17 00:00:00 2001 From: Gabo_Tech Date: Thu, 4 Jul 2024 00:39:30 +0200 Subject: [PATCH 10/18] pagination bug solved last stable version --- configExample.json | 138 ++++++++++++++++++++++++------------ main.py | 173 +++++++++++++++++++++++++++------------------ requirements.txt | 4 ++ 3 files changed, 201 insertions(+), 114 deletions(-) diff --git a/configExample.json b/configExample.json index 2810b50..3d533a0 100644 --- a/configExample.json +++ b/configExample.json @@ -1,55 +1,103 @@ { - "email": "example@example.com", - "password": "securePassword123!", - "keywords": ["Web Developer", "JavaScript", "React"], - "keywordsToAvoid": ["C++", ".NET", "Analyst", "PHP", "Python", "C", "Java"], - "locations": ["New York", "Los Angeles", "San Francisco"], - "driver_path": "/usr/local/bin/chromedriver", - "sortBy": "Alphabetical", + "email": "your_email@example.com", + "password": "your_secure_password", + "keywords": [ + "keyword1", + "keyword2", + "keyword3" + ], + "keywordsToAvoid": [ + "keyword1_to_avoid", + "keyword2_to_avoid", + "keyword3_to_avoid" + ], + "locations": [ + "location1", + "location2", + "location3" + ], + "driver_path": "path/to/driver", + "sortBy": "sort_preference", "filters": { "easy_apply": true, + "experience": [], + "jobType": ["job_type1", "job_type2"], + "timePostedRange": [], + "workplaceType": ["type1", "type2"], + "less_than_10_applicants": false + }, + "aiContext": { + "preferences": { + "workplaceType": "preference1", + "workplaceTypeAlternative": ["alternative1", "alternative2"], + "jobType": "preference2", + "jobTypeAlternative": ["alternative3", "alternative4"], + "prereferredEnd": "preference3", + "prereferredEndAlternative": ["alternative5", "alternative6"] + }, "experience": [ - "Internship", - "Entry Level", - "Associate", - "Mid-Senior Level", - "Director", - "Executive" + { + "title": "job_title", + "description": "job_description", + "date": "date_range", + "company": "company_name", + "location": "location", + "skills": [ + "skill1", + "skill2", + "skill3" + ] + } ], - "jobType": [ - "Full-Time", - "Part-Time", - "Contract", - "Internship", - "Temporary" + "education": [ + { + "title": "education_title", + "description": "education_description", + "date": "date_range", + "company": "institution_name", + "skills": [ + "skill1", + "skill2", + "skill3" + ] + }, + { + "title": "certification_title", + "description": "certification_description", + "date": "date_range", + "company": "certifying_body", + "skills": [ + "skill1", + "skill2", + "skill3" + ] + } ], - "timePostedRange": ["Any Time", "Last Month", "Past Week", "Past 24 Hours"], - "workplaceType": ["Remote", "Hybrid", "On-site"], - "less_than_10_applicants": true, - "commitments": [ - "Full-Time", - "Part-Time", - "Contract", - "Temporary", - "Volunteer" + "projects": [ + { + "name": "project_name", + "description": "project_description", + "technologies": [ + "technology1", + "technology2", + "technology3" + ] + } + ], + "skills": [ + "skill1", + "skill2", + "skill3" ] }, - "experience": [ - { - "title": "Junior Web Developer", - "description": "Developing responsive web applications using JavaScript and React.", - "date": "Jan 2023 - Present", - "company": "Example Company" - } - ], - "projects": [ - { - "title": "Project Alpha", - "desc": "A project description here...", - "link": "#", - "skills": ["JavaScript", "React", "Node.js"] + "user_inputs": { + "country1": { + "field1": "value1", + "field2": "value2" + }, + "country2": { + "field1": "value1", + "field2": "value2" } - ], - "skills": ["JavaScript", "React", "Node.js", "Express", "MongoDB"], - "user_inputs": {} + } } diff --git a/main.py b/main.py index aa9c644..4e4a6cf 100644 --- a/main.py +++ b/main.py @@ -23,6 +23,7 @@ class EasyApplyLinkedin: BASE_URL = "https://www.linkedin.com/jobs/search/" ERROR_LOG_PATH = Path("error_log.json") APPLIED_COMPANIES_LOG_PATH = Path("applied_companies_log.json") + FAILED_APPLICATIONS_LOG_PATH = Path("failed_applications_log.json") TIME_POSTED_MAPPING = { "Any Time": "", @@ -103,9 +104,10 @@ def __init__(self, data): def init_logging(self): """Initialize logging for error and applied companies.""" - logging.basicConfig(level=logging.ERROR) + logging.basicConfig(level=logging.INFO) self.error_logger = logging.getLogger("ErrorLogger") self.applied_companies = self.load_json(self.APPLIED_COMPANIES_LOG_PATH) + self.failed_applications = self.load_json(self.FAILED_APPLICATIONS_LOG_PATH) def load_json(self, path): """Load JSON data from the specified path.""" @@ -121,11 +123,16 @@ def save_json(self, path, data): def log_error(self, error_msg): """Log error messages with a timestamp.""" + self.error_logger.error(error_msg) errors = self.load_json(self.ERROR_LOG_PATH) errors[str(datetime.now())] = error_msg self.save_json(self.ERROR_LOG_PATH, errors) self.cleanup_error_log() + def log_info(self, message): + """Log informational messages.""" + logging.info(message) + def cleanup_error_log(self): """Clean up old error logs older than 1 day.""" errors = self.load_json(self.ERROR_LOG_PATH) @@ -149,6 +156,22 @@ def cleanup_applied_companies_log(self): } self.save_json(self.APPLIED_COMPANIES_LOG_PATH, self.applied_companies) + def log_failed_application(self, company): + """Log the company where application failed.""" + self.failed_applications[company] = str(datetime.now()) + self.save_json(self.FAILED_APPLICATIONS_LOG_PATH, self.failed_applications) + self.cleanup_failed_applications_log() + + def cleanup_failed_applications_log(self): + """Clean up logs of failed applications older than 2 weeks.""" + cutoff = datetime.now() - timedelta(weeks=2) + self.failed_applications = { + k: v + for k, v in self.failed_applications.items() + if datetime.fromisoformat(v) > cutoff + } + self.save_json(self.FAILED_APPLICATIONS_LOG_PATH, self.failed_applications) + def login_linkedin(self): """Log in to LinkedIn using the provided credentials.""" try: @@ -209,13 +232,11 @@ def job_search(self): if not self.check_no_results(): break else: - print( - f"No matching jobs found in {self.locations[self.current_location_index]}." - ) + self.log_info(f"No matching jobs found in {self.locations[self.current_location_index]}.") self.current_location_index += 1 except TimeoutException: - print("Timeout while trying to access the Jobs page or elements on it.") + self.log_info("Timeout while trying to access the Jobs page or elements on it.") self.current_location_index += 1 except Exception as e: self.log_error(f"Job search error: {e}") @@ -271,7 +292,7 @@ def apply_filters_and_search(self): self.driver.get(search_url) if self.check_no_results(): - print(f"No matching jobs found in {self.locations[self.current_location_index]}.") + self.log_info(f"No matching jobs found in {self.locations[self.current_location_index]}.") self.current_location_index += 1 else: break @@ -286,6 +307,15 @@ def check_no_results(self): except NoSuchElementException: return False + def find_element_with_retry(self, by, value, retries=3, delay=2): + """Find an element with retry logic.""" + for _ in range(retries): + try: + return self.driver.find_element(by, value) + except (NoSuchElementException, StaleElementReferenceException): + time.sleep(delay) + raise NoSuchElementException(f"Element not found: {by}, {value}") + def get_response_for_label(self, label_text): """Get user response for a given label text.""" current_location = self.locations[self.current_location_index] @@ -310,9 +340,7 @@ def get_checkbox_response_for_label(self, label_text): return location_specific_inputs[label_text] while True: - user_input = input( - f"Do you want to check the box for '{label_text}'? (yes/no): " - ).strip().lower() + user_input = input(f"Do you want to check the box for '{label_text}'? (yes/no): ").strip().lower() if user_input in ["yes", "no"]: response = user_input == "yes" if current_location not in self.context_data["user_inputs"]: @@ -341,6 +369,23 @@ def get_radio_response_for_label(self, label_text, options): self.context_data["user_inputs"][current_location][label_text] = response self.update_config_file() return response + else: + print("Invalid input, please try again.") + + def get_file_response_for_label(self, label_text): + """Get user response for a file upload labeled by the given text.""" + current_location = self.locations[self.current_location_index] + if current_location in self.context_data["user_inputs"]: + location_specific_inputs = self.context_data["user_inputs"][current_location] + if label_text in location_specific_inputs: + return location_specific_inputs[label_text] + + user_input = input(f"Please provide the file location for '{label_text}': ") + if current_location not in self.context_data["user_inputs"]: + self.context_data["user_inputs"][current_location] = {} + self.context_data["user_inputs"][current_location][label_text] = user_input + self.update_config_file() + return user_input def update_config_file(self): """Update the configuration file with the latest user inputs.""" @@ -351,6 +396,8 @@ def find_offers(self): """Find and apply to job offers.""" while self.current_location_index < len(self.locations): self.apply_filters_and_search() + + current_page = 1 while True: try: @@ -358,20 +405,27 @@ def find_offers(self): EC.presence_of_element_located((By.CLASS_NAME, "scaffold-layout__list-container")) ) - job_list_container = self.driver.find_element( - By.CLASS_NAME, "scaffold-layout__list-container" - ) + job_list_container = self.find_element_with_retry(By.CLASS_NAME, "scaffold-layout__list-container") job_list_items = job_list_container.find_elements(By.TAG_NAME, "li") for index in range(len(job_list_items)): try: - job_list_container = self.driver.find_element( - By.CLASS_NAME, "scaffold-layout__list-container" - ) + job_list_container = self.find_element_with_retry(By.CLASS_NAME, "scaffold-layout__list-container") job_list_items = job_list_container.find_elements(By.TAG_NAME, "li") job_item = job_list_items[index] - job_item.click() + + # Scroll the element into view + self.driver.execute_script("arguments[0].scrollIntoView(true);", job_item) + time.sleep(1) + + try: + # Attempt to click the element with JavaScript + self.driver.execute_script("arguments[0].click();", job_item) + except ElementClickInterceptedException: + self.log_info("Element click intercepted, skipping to next job...") + continue + time.sleep(2) WebDriverWait(self.driver, 10).until( @@ -380,22 +434,14 @@ def find_offers(self): ) ) - if self.job_already_applied(job_item): - print("Job already applied to, moving to next job...") - self.close_application_modal() - continue - company_name = self.get_company_name(job_item) - if company_name and company_name in self.applied_companies: - print( - f"Already applied to a job at {company_name}, skipping..." - ) + + if company_name in self.applied_companies: + self.log_info(f"Already applied to a job at {company_name}, skipping...") self.close_application_modal() continue - job_details_wrapper = self.driver.find_element( - By.CLASS_NAME, "jobs-search__job-details--wrapper" - ) + job_details_wrapper = self.find_element_with_retry(By.CLASS_NAME, "jobs-search__job-details--wrapper") try: apply_button = job_details_wrapper.find_element( @@ -410,44 +456,42 @@ def find_offers(self): ) ) - self.handle_easy_apply() - - if company_name: + try: + self.handle_easy_apply() self.log_applied_company(company_name) + except Exception as e: + self.log_info(f"Failed to apply at {company_name}: {str(e)}") + self.log_failed_application(company_name) except NoSuchElementException: - print("No apply button found, continuing to next job...") + self.log_info("No apply button found, continuing to next job...") continue - except ( - NoSuchElementException, - ElementNotInteractableException, - StaleElementReferenceException, - ) as e: - print(f"Exception occurred: {e}, continuing to next job...") + except (NoSuchElementException, ElementNotInteractableException, StaleElementReferenceException) as e: + self.log_info(f"Exception occurred: {e}, continuing to next job...") self.log_error(f"Find offers error: {e}") continue try: - pagination_container = self.driver.find_element( - By.CLASS_NAME, "artdeco-pagination__pages" - ) + pagination_container = self.find_element_with_retry(By.CLASS_NAME, "artdeco-pagination__pages") next_page_button = pagination_container.find_element( By.XPATH, - "//li[contains(@class, 'artdeco-pagination__indicator') and not(contains(@class, 'active selected'))]/button", + f"//button[@aria-label='Page {current_page + 1}']", ) self.driver.execute_script("arguments[0].click();", next_page_button) time.sleep(2) + current_page += 1 except NoSuchElementException: - print("No more pages left.") + self.log_info("No more pages left.") break except TimeoutException: - print("Timeout while waiting for job list container.") + self.log_info("Timeout while waiting for job list container.") self.log_error("Timeout while waiting for job list container.") break self.current_location_index += 1 + def get_company_name(self, job_item): """Extract the company name from a job listing.""" try: @@ -459,20 +503,6 @@ def get_company_name(self, job_item): except NoSuchElementException: return None - def job_already_applied(self, job_item): - """Check if a job has already been applied to.""" - try: - applied_element = job_item.find_element( - By.CSS_SELECTOR, - "li.job-card-container__footer-item.job-card-container__footer-job-state.t-bold", - ) - if "Applied" in applied_element.text: - return True - except NoSuchElementException: - pass - - return False - def handle_easy_apply(self): """Handle the easy apply process.""" while True: @@ -502,19 +532,19 @@ def handle_easy_apply(self): ) self.driver.execute_script("arguments[0].click();", submit_button) time.sleep(2) - print("Application submitted.") + self.log_info("Application submitted.") self.handle_done_button() break except NoSuchElementException: - print("Submit button not found, continuing to next job...") + self.log_info("Submit button not found, continuing to next job...") self.close_application_modal() break self.fill_form(modal_dialog) except TimeoutException: - print("No more steps found, exiting...") + self.log_info("No more steps found, exiting...") break except Exception as e: - print(f"Error during easy apply: {e}, skipping to next job...") + self.log_info(f"Error during easy apply: {e}, skipping to next job...") self.log_error(f"Easy apply error: {e}") self.close_application_modal() break @@ -583,6 +613,12 @@ def fill_form(self, modal_dialog): self.driver.execute_script("arguments[0].click();", radio) break + elif input_field.tag_name == "input" and input_field.get_attribute("type") == "file": + # Handle file upload + response = self.get_file_response_for_label(label_text) + input_field.send_keys(response) + time.sleep(1) + except NoSuchElementException: continue @@ -591,7 +627,7 @@ def fill_form(self, modal_dialog): next_button.click() time.sleep(2) except NoSuchElementException: - print("Next button not found, form might be complete or there is an issue.") + self.log_info("Next button not found, form might be complete or there is an issue.") def handle_done_button(self): """Handle the final done button after application submission.""" @@ -602,7 +638,7 @@ def handle_done_button(self): done_button.click() time.sleep(2) except TimeoutException: - print("Done button not found, skipping to next job.") + self.log_info("Done button not found, skipping to next job.") def close_application_modal(self): """Close the application modal.""" @@ -619,7 +655,7 @@ def close_application_modal(self): time.sleep(2) self.handle_discard_dialog() except TimeoutException: - print("Close button not found, skipping to next job.") + self.log_info("Close button not found, skipping to next job.") def handle_discard_dialog(self): """Handle the discard dialog when closing the application modal.""" @@ -632,18 +668,17 @@ def handle_discard_dialog(self): discard_button.click() time.sleep(2) except TimeoutException: - print("Discard button not found, skipping to next job.") + self.log_info("Discard button not found, skipping to next job.") def close_session(self): """Close the browser session.""" - print("End of the session") + self.log_info("End of the session") self.driver.close() self.driver.quit() def handle_captcha(self): """Handle CAPTCHA prompts manually.""" - print("CAPTCHA detected. Please solve the CAPTCHA manually and then press Enter to continue...") - input() + input("CAPTCHA detected. Please solve the CAPTCHA manually and then press Enter to continue...") if __name__ == "__main__": diff --git a/requirements.txt b/requirements.txt index 4ebcdf2..fa05aa0 100644 --- a/requirements.txt +++ b/requirements.txt @@ -21,3 +21,7 @@ pluggy==0.13.1 py==1.10.0 pyparsing==2.4.7 pytest==6.2.4 +transformers==4.28.1 +torch==2.0.1 +langdetect==1.0.9 +googletrans==4.0.0-rc1 From 38f5dae084c4b9ec40c917c211058fa372843370 Mon Sep 17 00:00:00 2001 From: Gabo_Tech Date: Thu, 4 Jul 2024 17:18:54 +0200 Subject: [PATCH 11/18] Bugs solved --- main.py | 1 - 1 file changed, 1 deletion(-) diff --git a/main.py b/main.py index 4e4a6cf..75c06d6 100644 --- a/main.py +++ b/main.py @@ -491,7 +491,6 @@ def find_offers(self): self.current_location_index += 1 - def get_company_name(self, job_item): """Extract the company name from a job listing.""" try: From f9fd28af688d756ee1ee1bc0100caf9c025e8789 Mon Sep 17 00:00:00 2001 From: Gabo_Tech Date: Thu, 4 Jul 2024 20:46:02 +0200 Subject: [PATCH 12/18] bugs troubleshoot it last working version --- README.md | 62 ++++------- configExample.json | 267 ++++++++++++++++++++++++++++++--------------- e2e_tests.py | 75 +++++++++++-- main.py | 18 +-- 4 files changed, 277 insertions(+), 145 deletions(-) diff --git a/README.md b/README.md index ca05ef7..4ba0d6a 100644 --- a/README.md +++ b/README.md @@ -8,7 +8,7 @@ These instructions will get you a copy of the project up and running on your loc ### Prerequisites -1. Install selenium. I used `pip` to install the selenium package. +1. Install Selenium. Use `pip` to install the Selenium package: ```sh pip install selenium ``` @@ -39,62 +39,38 @@ These instructions will get you a copy of the project up and running on your loc "keywordsToAvoid": ["C++", ".NET"], "locations": ["New York", "Los Angeles", "San Francisco"], "driver_path": "/usr/local/bin/geckodriver", - "sortBy": "Alphabetical", + "sortBy": "R", "filters": { "easy_apply": true, - "experience": ["Internship", "Entry Level", "Associate", "Mid-Senior Level", "Director", "Executive"], - "jobType": ["Full-Time", "Part-Time", "Contract", "Internship", "Temporary"], - "timePostedRange": ["Any Time", "Last Month", "Past Week", "Past 24 Hours"], + "experience": ["Internship", "Entry level", "Associate", "Mid-Senior level", "Director", "Executive"], + "jobType": ["Full-time", "Part-time", "Contract", "Internship", "Temporary"], + "timePostedRange": ["Any Time", "Last Month", "Past Week", "Past 24 hours"], "workplaceType": ["Remote", "Hybrid", "On-site"], - "less_than_10_applicants": true, - "commitments": ["Full-Time", "Part-Time", "Contract", "Temporary", "Volunteer"] - }, - "experience": [ - { - "title": "Junior Web Developer", - "description": "Developing responsive web applications using JavaScript and React.", - "date": "Jan 2023 - Present", - "company": "Example Company" - } - ], - "projects": [ - { - "title": "Project Alpha", - "desc": "A project description here...", - "link": "#", - "skills": ["JavaScript", "React", "Node.js"] - } - ], - "skills": [ - "JavaScript", - "React", - "Node.js", - "Express", - "MongoDB" - ], - "user_inputs": {} + "less_than_10_applicants": true + } } ``` -4. Update the locations code in the script: +4. Update the location codes in the script: ```python LOCATION_MAPPING = { + "Canada": "101174742", + "Portugal": "100364837", "Switzerland": "106693272", - "Spain": "105646813", "United States": "103644278", - "United Kingdom": "101165590", - "European Union": "91000000", - "European Economic Area": "91000002", + "Belgium": "100565514", + "Netherlands": "102890719", "DACH": "91000006", "Benelux": "91000005", - "Netherlands": "102890719", - "Belgium": "100565514", - "Germany": "101282230" + "European Union": "91000000", + "European Economic Area": "91000002", + "Germany": "101282230", + "Spain": "105646813", + "United Kingdom": "101165590" } ``` - This you can find the code in the geoId found in the LinkedIn url after doing a job search. - These are the right ones if you don't want to look in other places, but there are many more. - + You can find the code in the `geoId` found in the LinkedIn URL after doing a job search. These are the correct ones if you don't want to search elsewhere, but there are many more. + ### Usage 1. Run the application: diff --git a/configExample.json b/configExample.json index 3d533a0..01c3f67 100644 --- a/configExample.json +++ b/configExample.json @@ -1,103 +1,194 @@ { - "email": "your_email@example.com", - "password": "your_secure_password", + "email": "example@domain.com", + "password": "YourSecurePassword123!", "keywords": [ - "keyword1", - "keyword2", - "keyword3" + "TypeScript", + "Angular", + "React", + "React Native", + "Node", + "JavaScript", + "Frontend Engineer", + "Full-Stack Engineer", + "Backend Engineer" ], "keywordsToAvoid": [ - "keyword1_to_avoid", - "keyword2_to_avoid", - "keyword3_to_avoid" + "C++", + ".NET", + "Analyst", + "PHP", + "Python", + "C", + "Java", + "Go", + "Rust", + "Kotlin", + "Swift", + "Objective-C", + "Robotic", + "Data", + "Science", + "Cloud", + "AI", + "ML", + "DL", + "NLP", + "CV", + "DevOps", + "Solidity" ], "locations": [ - "location1", - "location2", - "location3" + "Canada", + "Portugal", + "Switzerland", + "Belgium", + "Netherlands", + "DACH", + "Benelux", + "European Union", + "European Economic Area", + "Germany", + "Spain", + "United States", + "United Kingdom" ], - "driver_path": "path/to/driver", - "sortBy": "sort_preference", + "driver_path": "/path/to/geckodriver", + "sortBy": "R", "filters": { - "easy_apply": true, - "experience": [], - "jobType": ["job_type1", "job_type2"], - "timePostedRange": [], - "workplaceType": ["type1", "type2"], - "less_than_10_applicants": false + "easy_apply": true, + "experience": [], + "jobType": [ + "Full-time", + "Contract" + ], + "timePostedRange": [], + "workplaceType": [ + "Remote", + "Hybrid" + ], + "less_than_10_applicants": false }, "aiContext": { - "preferences": { - "workplaceType": "preference1", - "workplaceTypeAlternative": ["alternative1", "alternative2"], - "jobType": "preference2", - "jobTypeAlternative": ["alternative3", "alternative4"], - "prereferredEnd": "preference3", - "prereferredEndAlternative": ["alternative5", "alternative6"] - }, - "experience": [ - { - "title": "job_title", - "description": "job_description", - "date": "date_range", - "company": "company_name", - "location": "location", - "skills": [ - "skill1", - "skill2", - "skill3" - ] - } - ], - "education": [ - { - "title": "education_title", - "description": "education_description", - "date": "date_range", - "company": "institution_name", - "skills": [ - "skill1", - "skill2", - "skill3" - ] + "preferences": { + "workplaceType": "Remote", + "workplaceTypeAlternative": [ + "Hybrid" + ], + "jobType": "Contract", + "jobTypeAlternative": [ + "Full-time" + ], + "prereferredEnd": "Backend", + "prereferredEndAlternative": [ + "Full-Stack", + "Frontend" + ] }, - { - "title": "certification_title", - "description": "certification_description", - "date": "date_range", - "company": "certifying_body", - "skills": [ - "skill1", - "skill2", - "skill3" - ] - } - ], - "projects": [ - { - "name": "project_name", - "description": "project_description", - "technologies": [ - "technology1", - "technology2", - "technology3" - ] - } - ], - "skills": [ - "skill1", - "skill2", - "skill3" - ] + "currentLocation": "Fake City, Country", + "willingToRelocate": true, + "experience": [ + { + "title": "Full-Stack Developer", + "description": "Developed an e-commerce platform using MERN stack.", + "date": "Jan 2021 - Present", + "company": "Tech Solutions", + "location": "Remote", + "skills": [ + "TypeScript", + "React", + "Node.js", + "Express.js", + "MongoDB" + ] + }, + { + "title": "Frontend Engineer", + "description": "Designed and implemented user interfaces with Angular.", + "date": "Jun 2019 - Dec 2020", + "company": "Web Creators", + "location": "San Francisco, CA", + "skills": [ + "JavaScript", + "Angular", + "HTML", + "CSS" + ] + } + ], + "education": [ + { + "title": "Bachelor of Science - Computer Science", + "description": "Studied various aspects of computer science, including algorithms, data structures, and web development.", + "date": "Sep 2015 - Jun 2019", + "company": "University of Somewhere", + "skills": [ + "Algorithms", + "Data Structures", + "Web Development", + "Machine Learning" + ] + } + ], + "projects": [ + { + "name": "Project Alpha", + "description": "A project management tool developed using React and Node.js.", + "technologies": [ + "React", + "Node.js", + "Express", + "MongoDB", + "Docker" + ] + } + ], + "skills": [ + "TypeScript", + "JavaScript", + "Angular", + "React", + "Node.js", + "Express.js", + "MongoDB", + "HTML", + "CSS" + ] }, "user_inputs": { - "country1": { - "field1": "value1", - "field2": "value2" - }, - "country2": { - "field1": "value1", - "field2": "value2" - } + "United States": { + "City\nCity": "Fake City, USA", + "What is your gender?\nWhat is your gender?": "Prefer not to say", + "Do you consider yourself to be disabled as defined by the Equality Act 2010?": "No", + "Do you require any particular arrangements to support you in the recruitment and selection process?": "No", + "What is your ethnic origin?\nWhat is your ethnic origin?": "White", + "I Agree Terms & Conditions": true, + "LinkedIn": true + }, + "Belgium": { + "What is your preferred name?": "John Doe", + "Do you now, or will you in the future, require visa sponsorship to work for our company in the country this role is advertised for?": "No", + "What are your salary expectations?": "60000", + "English": true, + "City\nCity": "Fake City, Belgium", + "I Agree Terms & Conditions": true, + "What language(s) do you speak and/or understand? What is your level?": "English, French - fluent", + "Are you legally authorized to work in the country of the job?": "Yes" + }, + "Netherlands": { + "What is your current location?": "Fake City, Netherlands", + "City\nCity": "Fake City, Netherlands", + "Legal Name (if different than above)": "John Doe", + "How did you hear about this job?": "LinkedIn", + "Do you now or will you in the future require immigration sponsorship to work at Company?": "No", + "What are your salary expectations?": "65000", + "This vacancy is for an internal position and we do not contract freelancers for this position. Do you acknowledge this statement?": "Yes" + }, + "Spain": { + "What is your level of proficiency in English?\nWhat is your level of proficiency in English?": "Native or bilingual", + "City\nCity": "Fake City, Spain", + "Indica tus expectativas salariales frente a un cambio.": "50000", + "Are you legally authorized to work in Spain?": "Yes", + "What is your salary expectation?": "50000" + } } } diff --git a/e2e_tests.py b/e2e_tests.py index 67293a0..a17eff9 100644 --- a/e2e_tests.py +++ b/e2e_tests.py @@ -1,7 +1,7 @@ import pytest from selenium import webdriver from selenium.webdriver.firefox.service import Service as FirefoxService -from easy_apply_linkedin import EasyApplyLinkedin +from main import EasyApplyLinkedin @pytest.fixture def setup_browser(): @@ -14,18 +14,79 @@ def setup_browser(): def setup_bot(setup_browser): data = { "email": "sendmessage@gabo.email", - "password": "bp8v9fvk#?QaKe7", - "keywords": ["TypeScript", "Angular", "React"], - "keywordsToAvoid": ["C++", ".NET"], - "locations": ["Switzerland", "Belgium"], + "password": "***,****,****", + "keywords": [ + "TypeScript", + "Angular", + "React", + "React Native", + "Node", + "JavaScript", + "Frontend Engineer", + "Full-Stack Engineer", + "Backend Engineer" + ], + "keywordsToAvoid": [ + "C++", + ".NET", + "Analyst", + "PHP", + "Python", + "C", + "Java", + "Go", + "Rust", + "Kotlin", + "Swift", + "Objective-C", + "Rust", + "Kotlin", + "Swift", + "C#", + ".Net", + ".net", + "Robotic", + "Data", + "Science", + "Cloud", + "Robotics", + "AI", + "ML", + "DL", + "NLP", + "CV", + "DevOps", + "Solidity" + ], + "locations": [ + "Canada", + "Portugal", + "Switzerland", + "Belgium", + "Netherlands", + "DACH", + "Benelux", + "European Union", + "European Economic Area", + "Germany", + "Spain", + "United States", + "United Kingdom" + ], "driver_path": "/usr/local/bin/geckodriver", "sortBy": "R", "filters": { "easy_apply": True, "experience": [], - "jobType": ["Full-time", "Contract"], + "jobType": [ + "Full-time", + "Contract" + ], "timePostedRange": [], - "workplaceType": ["Remote", "Hybrid"], + "workplaceType": [ + "Remote", + "Hybrid" + ], "less_than_10_applicants": False } } diff --git a/main.py b/main.py index 75c06d6..7d6a42b 100644 --- a/main.py +++ b/main.py @@ -72,17 +72,19 @@ class EasyApplyLinkedin: } LOCATION_MAPPING = { + "Canada": "101174742", + "Portugal": "100364837", "Switzerland": "106693272", - "Spain": "105646813", "United States": "103644278", - "United Kingdom": "101165590", - "European Union": "91000000", - "European Economic Area": "91000002", + "Belgium": "100565514", + "Netherlands": "102890719", "DACH": "91000006", "Benelux": "91000005", - "Netherlands": "102890719", - "Belgium": "100565514", + "European Union": "91000000", + "European Economic Area": "91000002", "Germany": "101282230", + "Spain": "105646813", + "United Kingdom": "101165590", } def __init__(self, data): @@ -413,6 +415,9 @@ def find_offers(self): job_list_container = self.find_element_with_retry(By.CLASS_NAME, "scaffold-layout__list-container") job_list_items = job_list_container.find_elements(By.TAG_NAME, "li") + if index >= len(job_list_items): + break + job_item = job_list_items[index] # Scroll the element into view @@ -613,7 +618,6 @@ def fill_form(self, modal_dialog): break elif input_field.tag_name == "input" and input_field.get_attribute("type") == "file": - # Handle file upload response = self.get_file_response_for_label(label_text) input_field.send_keys(response) time.sleep(1) From 7c349db7278fb180f57271ea56dd57cad5e1d44b Mon Sep 17 00:00:00 2001 From: Gabo_Tech Date: Thu, 11 Jul 2024 10:49:43 +0200 Subject: [PATCH 13/18] Dark mode added --- main.py | 19 +++++++++++++++++-- 1 file changed, 17 insertions(+), 2 deletions(-) diff --git a/main.py b/main.py index 7d6a42b..752ed8c 100644 --- a/main.py +++ b/main.py @@ -72,6 +72,7 @@ class EasyApplyLinkedin: } LOCATION_MAPPING = { + "Texas":"102748797", "Canada": "101174742", "Portugal": "100364837", "Switzerland": "106693272", @@ -178,6 +179,16 @@ def login_linkedin(self): """Log in to LinkedIn using the provided credentials.""" try: self.driver.get("https://www.linkedin.com/login") + self.driver.add_cookie({ + 'name': 'li_theme', + 'value': 'dark', + 'domain': '.linkedin.com', + 'path': '/', + 'expires': int(time.time() + 365 * 24 * 60 * 60), + 'secure': True, + 'httpOnly': False + }) + self.driver.refresh() WebDriverWait(self.driver, 10).until( EC.presence_of_element_located((By.NAME, "session_key")) ) @@ -247,8 +258,12 @@ def job_search(self): def construct_url(self): """Construct the URL for job search with applied filters.""" current_location = self.locations[self.current_location_index] + keywords_query = f'({self.keywords})' + keywords_to_avoid_query = f'NOT ({self.keywords_to_avoid})' + combined_keywords = f'{keywords_query} {keywords_to_avoid_query}' + params = { - "keywords": f"({self.keywords}) NOT ({self.keywords_to_avoid})", + "keywords": combined_keywords, "origin": "JOB_SEARCH_PAGE_JOB_FILTER", "refresh": "true", "sortBy": self.sort_by, @@ -691,4 +706,4 @@ def handle_captcha(self): bot.login_linkedin() bot.job_search() bot.find_offers() - bot.close_session() + bot.close_session() \ No newline at end of file From da5f924ce5ccc502d7ae46cdc7f7509625a9ebf4 Mon Sep 17 00:00:00 2001 From: Gabo_Tech Date: Fri, 12 Jul 2024 01:53:30 +0200 Subject: [PATCH 14/18] one less bug one reason less to crash --- main.py | 12 +++++++++--- 1 file changed, 9 insertions(+), 3 deletions(-) diff --git a/main.py b/main.py index 752ed8c..d06c4fd 100644 --- a/main.py +++ b/main.py @@ -115,8 +115,12 @@ def init_logging(self): def load_json(self, path): """Load JSON data from the specified path.""" if path.exists(): - with path.open("r") as file: - return json.load(file) + try: + with path.open("r") as file: + return json.load(file) + except json.JSONDecodeError: + self.log_error(f"Error decoding JSON from {path}") + return {} return {} def save_json(self, path, data): @@ -242,6 +246,7 @@ def job_search(self): search_keywords.click() search_keywords.send_keys(Keys.RETURN) + time.sleep(5) # wait for the search results to load if not self.check_no_results(): break else: @@ -307,6 +312,7 @@ def apply_filters_and_search(self): while self.current_location_index < len(self.locations): search_url = self.construct_url() self.driver.get(search_url) + time.sleep(5) # wait for the search results to load if self.check_no_results(): self.log_info(f"No matching jobs found in {self.locations[self.current_location_index]}.") @@ -706,4 +712,4 @@ def handle_captcha(self): bot.login_linkedin() bot.job_search() bot.find_offers() - bot.close_session() \ No newline at end of file + bot.close_session() From c1997c19d2dbc59b331246108a472640e77d9e7b Mon Sep 17 00:00:00 2001 From: Gabo_Tech Date: Fri, 12 Jul 2024 03:09:19 +0200 Subject: [PATCH 15/18] one less bug fixed crash with fielsets of checkboxes --- main.py | 138 +++++++++++++++++++++++++++++--------------------------- 1 file changed, 72 insertions(+), 66 deletions(-) diff --git a/main.py b/main.py index d06c4fd..eff9e78 100644 --- a/main.py +++ b/main.py @@ -72,7 +72,7 @@ class EasyApplyLinkedin: } LOCATION_MAPPING = { - "Texas":"102748797", + "Texas": "102748797", "Canada": "101174742", "Portugal": "100364837", "Switzerland": "106693272", @@ -246,7 +246,7 @@ def job_search(self): search_keywords.click() search_keywords.send_keys(Keys.RETURN) - time.sleep(5) # wait for the search results to load + time.sleep(5) if not self.check_no_results(): break else: @@ -312,7 +312,7 @@ def apply_filters_and_search(self): while self.current_location_index < len(self.locations): search_url = self.construct_url() self.driver.get(search_url) - time.sleep(5) # wait for the search results to load + time.sleep(5) if self.check_no_results(): self.log_info(f"No matching jobs found in {self.locations[self.current_location_index]}.") @@ -419,7 +419,7 @@ def find_offers(self): """Find and apply to job offers.""" while self.current_location_index < len(self.locations): self.apply_filters_and_search() - + current_page = 1 while True: @@ -440,13 +440,11 @@ def find_offers(self): break job_item = job_list_items[index] - - # Scroll the element into view + self.driver.execute_script("arguments[0].scrollIntoView(true);", job_item) time.sleep(1) - + try: - # Attempt to click the element with JavaScript self.driver.execute_script("arguments[0].click();", job_item) except ElementClickInterceptedException: self.log_info("Element click intercepted, skipping to next job...") @@ -461,14 +459,14 @@ def find_offers(self): ) company_name = self.get_company_name(job_item) - + if company_name in self.applied_companies: self.log_info(f"Already applied to a job at {company_name}, skipping...") self.close_application_modal() continue job_details_wrapper = self.find_element_with_retry(By.CLASS_NAME, "jobs-search__job-details--wrapper") - + try: apply_button = job_details_wrapper.find_element( By.CSS_SELECTOR, "button.jobs-apply-button.artdeco-button--primary" @@ -503,7 +501,7 @@ def find_offers(self): next_page_button = pagination_container.find_element( By.XPATH, f"//button[@aria-label='Page {current_page + 1}']", - ) + ) self.driver.execute_script("arguments[0].click();", next_page_button) time.sleep(2) current_page += 1 @@ -582,66 +580,50 @@ def fill_form(self, modal_dialog): for element in form_elements: try: label = element.find_element(By.CSS_SELECTOR, "label, legend") - input_field = element.find_element(By.CSS_SELECTOR, "input, select, textarea") label_text = label.text.strip() - if input_field.tag_name == "input" and input_field.get_attribute("type") == "text": - response = self.get_response_for_label(label_text) - if input_field.get_attribute("value") == "": - input_field.send_keys(response) - time.sleep(1) - input_field.send_keys(Keys.ARROW_DOWN) - input_field.send_keys(Keys.RETURN) - - elif input_field.tag_name == "select": - response = self.get_response_for_label(label_text) - select_options = input_field.find_elements(By.TAG_NAME, "option") - for option in select_options: - if option.get_attribute("value") == response: - option.click() - break + if "data-test-checkbox-form-component" in element.get_attribute("outerHTML"): + self.handle_checkboxes(element) + else: + input_field = element.find_element(By.CSS_SELECTOR, "input, select, textarea") - elif input_field.tag_name == "textarea": - response = self.get_response_for_label(label_text) - if input_field.get_attribute("value") == "": - input_field.send_keys(response) + if input_field.tag_name == "input" and input_field.get_attribute("type") == "text": + response = self.get_response_for_label(label_text) + if input_field.get_attribute("value") == "": + input_field.send_keys(response) + time.sleep(1) + input_field.send_keys(Keys.ARROW_DOWN) + input_field.send_keys(Keys.RETURN) + + elif input_field.tag_name == "select": + response = self.get_response_for_label(label_text) + select_options = input_field.find_elements(By.TAG_NAME, "option") + for option in select_options: + if option.get_attribute("value") == response: + option.click() + break - elif input_field.tag_name == "input" and input_field.get_attribute("type") == "checkbox": - checkboxes = element.find_elements(By.CSS_SELECTOR, "input[type='checkbox']") - for checkbox in checkboxes: - checkbox_label = checkbox.find_element(By.XPATH, "./following-sibling::label").text.strip() - response = self.get_checkbox_response_for_label(checkbox_label) - if response is not None: - try: - if response and not checkbox.is_selected(): - self.driver.execute_script("arguments[0].click();", checkbox) - elif not response and checkbox.is_selected(): - self.driver.execute_script("arguments[0].click();", checkbox) - except ElementClickInterceptedException: - self.driver.execute_script("arguments[0].click();", checkbox) - except StaleElementReferenceException: - checkbox = element.find_element(By.XPATH, f".//input[@type='checkbox' and ./following-sibling::label[text()='{checkbox_label}']]") - if response and not checkbox.is_selected(): - self.driver.execute_script("arguments[0].click();", checkbox) - elif not response and checkbox.is_selected(): - self.driver.execute_script("arguments[0].click();", checkbox) - - elif input_field.tag_name == "input" and input_field.get_attribute("type") == "radio": - radio_buttons = element.find_elements(By.CSS_SELECTOR, "input[type='radio']") - for radio in radio_buttons: - radio_label = radio.find_element(By.XPATH, "./following-sibling::label").text.strip() - response = self.get_radio_response_for_label(label_text, [rb.find_element(By.XPATH, "./following-sibling::label").text.strip() for rb in radio_buttons]) - if response.lower() == radio_label.lower(): - try: - radio.click() - except ElementClickInterceptedException: - self.driver.execute_script("arguments[0].click();", radio) - break + elif input_field.tag_name == "textarea": + response = self.get_response_for_label(label_text) + if input_field.get_attribute("value") == "": + input_field.send_keys(response) + + elif input_field.tag_name == "input" and input_field.get_attribute("type") == "radio": + radio_buttons = element.find_elements(By.CSS_SELECTOR, "input[type='radio']") + for radio in radio_buttons: + radio_label = radio.find_element(By.XPATH, "./following-sibling::label").text.strip() + response = self.get_radio_response_for_label(label_text, [rb.find_element(By.XPATH, "./following-sibling::label").text.strip() for rb in radio_buttons]) + if response.lower() == radio_label.lower(): + try: + radio.click() + except ElementClickInterceptedException: + self.driver.execute_script("arguments[0].click();", radio) + break - elif input_field.tag_name == "input" and input_field.get_attribute("type") == "file": - response = self.get_file_response_for_label(label_text) - input_field.send_keys(response) - time.sleep(1) + elif input_field.tag_name == "input" and input_field.get_attribute("type") == "file": + response = self.get_file_response_for_label(label_text) + input_field.send_keys(response) + time.sleep(1) except NoSuchElementException: continue @@ -653,6 +635,30 @@ def fill_form(self, modal_dialog): except NoSuchElementException: self.log_info("Next button not found, form might be complete or there is an issue.") + def handle_checkboxes(self, element): + """Handle multiple checkbox inputs.""" + checkboxes = element.find_elements(By.CSS_SELECTOR, "input[type='checkbox']") + for checkbox in checkboxes: + try: + checkbox_label = checkbox.find_element(By.XPATH, "./following-sibling::label").text.strip() + response = self.get_checkbox_response_for_label(checkbox_label) + if response is not None: + if response and not checkbox.is_selected(): + self.driver.execute_script("arguments[0].click();", checkbox) + elif not response and checkbox.is_selected(): + self.driver.execute_script("arguments[0].click();", checkbox) + except (ElementClickInterceptedException, StaleElementReferenceException): + self.log_info(f"Checkbox interaction failed for {checkbox_label}, attempting to retry.") + try: + checkbox = element.find_element(By.XPATH, f".//input[@type='checkbox' and ./following-sibling::label[text()='{checkbox_label}']]") + if response and not checkbox.is_selected(): + self.driver.execute_script("arguments[0].click();", checkbox) + elif not response and checkbox.is_selected(): + self.driver.execute_script("arguments[0].click();", checkbox) + except NoSuchElementException: + self.log_info(f"Checkbox not found after retry for {checkbox_label}.") + continue + def handle_done_button(self): """Handle the final done button after application submission.""" try: From ba7c2afeba66d8c25dae3fdfe440094eb01cb38c Mon Sep 17 00:00:00 2001 From: Gabo_Tech Date: Fri, 12 Jul 2024 08:33:28 +0200 Subject: [PATCH 16/18] fieldset bug fixed --- main.py | 106 +++++++++++++++++++++++++++++++++----------------------- 1 file changed, 62 insertions(+), 44 deletions(-) diff --git a/main.py b/main.py index eff9e78..38267c6 100644 --- a/main.py +++ b/main.py @@ -72,7 +72,7 @@ class EasyApplyLinkedin: } LOCATION_MAPPING = { - "Texas": "102748797", + "Texas":"102748797", "Canada": "101174742", "Portugal": "100364837", "Switzerland": "106693272", @@ -246,7 +246,7 @@ def job_search(self): search_keywords.click() search_keywords.send_keys(Keys.RETURN) - time.sleep(5) + time.sleep(5) # wait for the search results to load if not self.check_no_results(): break else: @@ -312,7 +312,7 @@ def apply_filters_and_search(self): while self.current_location_index < len(self.locations): search_url = self.construct_url() self.driver.get(search_url) - time.sleep(5) + time.sleep(5) # wait for the search results to load if self.check_no_results(): self.log_info(f"No matching jobs found in {self.locations[self.current_location_index]}.") @@ -354,24 +354,6 @@ def get_response_for_label(self, label_text): self.update_config_file() return user_input - def get_checkbox_response_for_label(self, label_text): - """Get user response for a checkbox labeled by the given text.""" - current_location = self.locations[self.current_location_index] - if current_location in self.context_data["user_inputs"]: - location_specific_inputs = self.context_data["user_inputs"][current_location] - if label_text in location_specific_inputs: - return location_specific_inputs[label_text] - - while True: - user_input = input(f"Do you want to check the box for '{label_text}'? (yes/no): ").strip().lower() - if user_input in ["yes", "no"]: - response = user_input == "yes" - if current_location not in self.context_data["user_inputs"]: - self.context_data["user_inputs"][current_location] = {} - self.context_data["user_inputs"][current_location][label_text] = response - self.update_config_file() - return response - def get_radio_response_for_label(self, label_text, options): """Get user response for a radio button group labeled by the given text.""" current_location = self.locations[self.current_location_index] @@ -419,7 +401,7 @@ def find_offers(self): """Find and apply to job offers.""" while self.current_location_index < len(self.locations): self.apply_filters_and_search() - + current_page = 1 while True: @@ -440,11 +422,13 @@ def find_offers(self): break job_item = job_list_items[index] - + + # Scroll the element into view self.driver.execute_script("arguments[0].scrollIntoView(true);", job_item) time.sleep(1) - + try: + # Attempt to click the element with JavaScript self.driver.execute_script("arguments[0].click();", job_item) except ElementClickInterceptedException: self.log_info("Element click intercepted, skipping to next job...") @@ -459,14 +443,14 @@ def find_offers(self): ) company_name = self.get_company_name(job_item) - + if company_name in self.applied_companies: self.log_info(f"Already applied to a job at {company_name}, skipping...") self.close_application_modal() continue job_details_wrapper = self.find_element_with_retry(By.CLASS_NAME, "jobs-search__job-details--wrapper") - + try: apply_button = job_details_wrapper.find_element( By.CSS_SELECTOR, "button.jobs-apply-button.artdeco-button--primary" @@ -501,7 +485,7 @@ def find_offers(self): next_page_button = pagination_container.find_element( By.XPATH, f"//button[@aria-label='Page {current_page + 1}']", - ) + ) self.driver.execute_script("arguments[0].click();", next_page_button) time.sleep(2) current_page += 1 @@ -638,26 +622,60 @@ def fill_form(self, modal_dialog): def handle_checkboxes(self, element): """Handle multiple checkbox inputs.""" checkboxes = element.find_elements(By.CSS_SELECTOR, "input[type='checkbox']") - for checkbox in checkboxes: + for index in range(len(checkboxes)): + checkbox_label = None try: + checkbox = checkboxes[index] checkbox_label = checkbox.find_element(By.XPATH, "./following-sibling::label").text.strip() response = self.get_checkbox_response_for_label(checkbox_label) if response is not None: - if response and not checkbox.is_selected(): - self.driver.execute_script("arguments[0].click();", checkbox) - elif not response and checkbox.is_selected(): - self.driver.execute_script("arguments[0].click();", checkbox) - except (ElementClickInterceptedException, StaleElementReferenceException): - self.log_info(f"Checkbox interaction failed for {checkbox_label}, attempting to retry.") - try: - checkbox = element.find_element(By.XPATH, f".//input[@type='checkbox' and ./following-sibling::label[text()='{checkbox_label}']]") - if response and not checkbox.is_selected(): - self.driver.execute_script("arguments[0].click();", checkbox) - elif not response and checkbox.is_selected(): - self.driver.execute_script("arguments[0].click();", checkbox) - except NoSuchElementException: - self.log_info(f"Checkbox not found after retry for {checkbox_label}.") - continue + self.set_checkbox_state(checkbox, checkbox_label, response) + except (ElementClickInterceptedException, StaleElementReferenceException) as e: + self.log_info(f"Checkbox interaction failed for {checkbox_label}, attempting to retry. Error: {e}") + self.retry_checkbox_interaction(element, index) + + def retry_checkbox_interaction(self, element, index): + """Retry interaction with the checkbox in case of exceptions.""" + retries = 3 + while retries > 0: + retries -= 1 + try: + checkboxes = element.find_elements(By.CSS_SELECTOR, "input[type='checkbox']") + checkbox = checkboxes[index] + checkbox_label = checkbox.find_element(By.XPATH, "./following-sibling::label").text.strip() + response = self.get_checkbox_response_for_label(checkbox_label) + if response is not None: + self.set_checkbox_state(checkbox, checkbox_label, response) + return + except (NoSuchElementException, StaleElementReferenceException) as e: + self.log_info(f"Retry failed for {checkbox_label}. Error: {e}") + if retries == 0: + self.log_info(f"Skipping {checkbox_label} after multiple retries.") + + def set_checkbox_state(self, checkbox, checkbox_label, response): + """Set the state of a checkbox.""" + if response and not checkbox.is_selected(): + self.driver.execute_script("arguments[0].click();", checkbox) + elif not response and checkbox.is_selected(): + self.driver.execute_script("arguments[0].click();", checkbox) + + def get_checkbox_response_for_label(self, label_text): + """Get user response for a checkbox labeled by the given text.""" + current_location = self.locations[self.current_location_index] + if current_location not in self.context_data["user_inputs"]: + self.context_data["user_inputs"][current_location] = {} + + location_specific_inputs = self.context_data["user_inputs"][current_location] + if label_text in location_specific_inputs: + return location_specific_inputs[label_text] + + while True: + user_input = input(f"Do you want to check the box for '{label_text}'? (yes/no): ").strip().lower() + if user_input in ["yes", "no"]: + response = user_input == "yes" + location_specific_inputs[label_text] = response + self.update_config_file() + return response def handle_done_button(self): """Handle the final done button after application submission.""" @@ -718,4 +736,4 @@ def handle_captcha(self): bot.login_linkedin() bot.job_search() bot.find_offers() - bot.close_session() + bot.close_session() \ No newline at end of file From 95fe614a62260b2d0262f3450911f4282e115fb2 Mon Sep 17 00:00:00 2001 From: Gabo_Tech Date: Tue, 16 Jul 2024 14:49:21 +0200 Subject: [PATCH 17/18] updated logging dropdown options to terminal --- main.py | 22 ++++++++++++++-------- 1 file changed, 14 insertions(+), 8 deletions(-) diff --git a/main.py b/main.py index 38267c6..9e7882d 100644 --- a/main.py +++ b/main.py @@ -72,7 +72,7 @@ class EasyApplyLinkedin: } LOCATION_MAPPING = { - "Texas":"102748797", + "Texas": "102748797", "Canada": "101174742", "Portugal": "100364837", "Switzerland": "106693272", @@ -188,7 +188,7 @@ def login_linkedin(self): 'value': 'dark', 'domain': '.linkedin.com', 'path': '/', - 'expires': int(time.time() + 365 * 24 * 60 * 60), + 'expires': int(time.time() + 365 * 24 * 60 * 60), 'secure': True, 'httpOnly': False }) @@ -263,9 +263,7 @@ def job_search(self): def construct_url(self): """Construct the URL for job search with applied filters.""" current_location = self.locations[self.current_location_index] - keywords_query = f'({self.keywords})' - keywords_to_avoid_query = f'NOT ({self.keywords_to_avoid})' - combined_keywords = f'{keywords_query} {keywords_to_avoid_query}' + combined_keywords = f'{self.keywords} NOT {self.keywords_to_avoid}' params = { "keywords": combined_keywords, @@ -559,15 +557,23 @@ def handle_easy_apply(self): def fill_form(self, modal_dialog): """Fill out the application form.""" form_elements = modal_dialog.find_elements( - By.CSS_SELECTOR, "div[data-test-form-element], fieldset[data-test-form-builder-radio-button-form-component], fieldset[data-test-checkbox-form-component]" + By.CSS_SELECTOR, "div[data-test-form-element], fieldset[data-test-form-builder-radio-button-form-component], fieldset[data-test-checkbox-form-component], div[data-test-text-entity-list-form-component]" ) for element in form_elements: try: - label = element.find_element(By.CSS_SELECTOR, "label, legend") + label = element.find_element(By.CSS_SELECTOR, "label, legend, span[aria-hidden='true']") label_text = label.text.strip() if "data-test-checkbox-form-component" in element.get_attribute("outerHTML"): self.handle_checkboxes(element) + elif "data-test-text-entity-list-form-component" in element.get_attribute("outerHTML"): + select_element = element.find_element(By.CSS_SELECTOR, "select") + options = [option.text for option in select_element.find_elements(By.TAG_NAME, "option")] + response = self.get_radio_response_for_label(label_text, options[1:]) # Exclude "Select an option" + for option in select_element.find_elements(By.TAG_NAME, "option"): + if option.text == response: + option.click() + break else: input_field = element.find_element(By.CSS_SELECTOR, "input, select, textarea") @@ -736,4 +742,4 @@ def handle_captcha(self): bot.login_linkedin() bot.job_search() bot.find_offers() - bot.close_session() \ No newline at end of file + bot.close_session() From 7d800970f8972786ad50afe6637ac7478af44b45 Mon Sep 17 00:00:00 2001 From: Gabo_Tech Date: Tue, 23 Jul 2024 00:55:19 +0200 Subject: [PATCH 18/18] Added collections filter --- configExample.json | 1 + main.py | 171 ++++++++++++++++++++++++++++++++------------- 2 files changed, 123 insertions(+), 49 deletions(-) diff --git a/configExample.json b/configExample.json index 01c3f67..603289f 100644 --- a/configExample.json +++ b/configExample.json @@ -68,6 +68,7 @@ ], "less_than_10_applicants": false }, + "collection": "", "aiContext": { "preferences": { "workplaceType": "Remote", diff --git a/main.py b/main.py index 9e7882d..fe1a178 100644 --- a/main.py +++ b/main.py @@ -18,9 +18,14 @@ ) from selenium.webdriver.firefox.service import Service as FirefoxService - class EasyApplyLinkedin: BASE_URL = "https://www.linkedin.com/jobs/search/" + COLLECTION_URLS = { + "small_business": "https://www.linkedin.com/jobs/collections/small-business", + "remote_jobs": "https://www.linkedin.com/jobs/collections/remote-jobs", + "easy_apply": "https://www.linkedin.com/jobs/collections/easy-apply", + "top_applicant": "https://www.linkedin.com/jobs/collections/top-applicant" + } ERROR_LOG_PATH = Path("error_log.json") APPLIED_COMPANIES_LOG_PATH = Path("applied_companies_log.json") FAILED_APPLICATIONS_LOG_PATH = Path("failed_applications_log.json") @@ -89,13 +94,13 @@ class EasyApplyLinkedin: } def __init__(self, data): - """Initialize the EasyApplyLinkedin instance with user data.""" self.email = data["email"] self.password = data["password"] self.keywords = " OR ".join(data["keywords"]) self.keywords_to_avoid = " NOT ".join(data["keywordsToAvoid"]) self.locations = data["locations"] self.filters = data["filters"] + self.collection = data.get("collection", "") self.sort_by = data["sortBy"] self.context_data = data self.current_location_index = 0 @@ -106,14 +111,12 @@ def __init__(self, data): self.init_logging() def init_logging(self): - """Initialize logging for error and applied companies.""" logging.basicConfig(level=logging.INFO) self.error_logger = logging.getLogger("ErrorLogger") self.applied_companies = self.load_json(self.APPLIED_COMPANIES_LOG_PATH) self.failed_applications = self.load_json(self.FAILED_APPLICATIONS_LOG_PATH) def load_json(self, path): - """Load JSON data from the specified path.""" if path.exists(): try: with path.open("r") as file: @@ -124,12 +127,10 @@ def load_json(self, path): return {} def save_json(self, path, data): - """Save JSON data to the specified path.""" with path.open("w") as file: json.dump(data, file, indent=4) def log_error(self, error_msg): - """Log error messages with a timestamp.""" self.error_logger.error(error_msg) errors = self.load_json(self.ERROR_LOG_PATH) errors[str(datetime.now())] = error_msg @@ -137,24 +138,20 @@ def log_error(self, error_msg): self.cleanup_error_log() def log_info(self, message): - """Log informational messages.""" logging.info(message) def cleanup_error_log(self): - """Clean up old error logs older than 1 day.""" errors = self.load_json(self.ERROR_LOG_PATH) cutoff = datetime.now() - timedelta(days=1) errors = {k: v for k, v in errors.items() if datetime.fromisoformat(k) > cutoff} self.save_json(self.ERROR_LOG_PATH, errors) def log_applied_company(self, company): - """Log the company to which an application was submitted.""" self.applied_companies[company] = str(datetime.now()) self.save_json(self.APPLIED_COMPANIES_LOG_PATH, self.applied_companies) self.cleanup_applied_companies_log() def cleanup_applied_companies_log(self): - """Clean up logs of applied companies older than 2 weeks.""" cutoff = datetime.now() - timedelta(weeks=2) self.applied_companies = { k: v @@ -164,13 +161,11 @@ def cleanup_applied_companies_log(self): self.save_json(self.APPLIED_COMPANIES_LOG_PATH, self.applied_companies) def log_failed_application(self, company): - """Log the company where application failed.""" self.failed_applications[company] = str(datetime.now()) self.save_json(self.FAILED_APPLICATIONS_LOG_PATH, self.failed_applications) self.cleanup_failed_applications_log() def cleanup_failed_applications_log(self): - """Clean up logs of failed applications older than 2 weeks.""" cutoff = datetime.now() - timedelta(weeks=2) self.failed_applications = { k: v @@ -180,7 +175,6 @@ def cleanup_failed_applications_log(self): self.save_json(self.FAILED_APPLICATIONS_LOG_PATH, self.failed_applications) def login_linkedin(self): - """Log in to LinkedIn using the provided credentials.""" try: self.driver.get("https://www.linkedin.com/login") self.driver.add_cookie({ @@ -213,7 +207,6 @@ def login_linkedin(self): self.log_error(f"Login error: {e}") def job_search(self): - """Perform job search based on keywords and locations.""" while self.current_location_index < len(self.locations): try: WebDriverWait(self.driver, 20).until( @@ -227,8 +220,7 @@ def job_search(self): ) ) search_keywords = self.driver.find_element( - By.CSS_SELECTOR, "input[aria-label='Search by title, skill, or company']" - ) + By.CSS_SELECTOR, "input[aria-label='Search by title, skill, or company']") search_keywords.clear() search_keywords.send_keys(self.keywords) search_keywords.send_keys(" NOT ") @@ -239,14 +231,13 @@ def job_search(self): ) ) search_location = self.driver.find_element( - By.CSS_SELECTOR, "input[aria-label='City, state, or zip code']" - ) + By.CSS_SELECTOR, "input[aria-label='City, state, or zip code']") search_location.clear() search_location.send_keys(self.locations[self.current_location_index]) search_keywords.click() search_keywords.send_keys(Keys.RETURN) - time.sleep(5) # wait for the search results to load + time.sleep(5) if not self.check_no_results(): break else: @@ -261,7 +252,6 @@ def job_search(self): self.current_location_index += 1 def construct_url(self): - """Construct the URL for job search with applied filters.""" current_location = self.locations[self.current_location_index] combined_keywords = f'{self.keywords} NOT {self.keywords_to_avoid}' @@ -306,11 +296,10 @@ def construct_url(self): return url def apply_filters_and_search(self): - """Apply filters to the job search and navigate to the search URL.""" while self.current_location_index < len(self.locations): search_url = self.construct_url() self.driver.get(search_url) - time.sleep(5) # wait for the search results to load + time.sleep(5) if self.check_no_results(): self.log_info(f"No matching jobs found in {self.locations[self.current_location_index]}.") @@ -319,7 +308,6 @@ def apply_filters_and_search(self): break def check_no_results(self): - """Check if the job search resulted in no matches.""" try: no_results_element = self.driver.find_element( By.CSS_SELECTOR, "div.jobs-search-no-results-banner" @@ -329,7 +317,6 @@ def check_no_results(self): return False def find_element_with_retry(self, by, value, retries=3, delay=2): - """Find an element with retry logic.""" for _ in range(retries): try: return self.driver.find_element(by, value) @@ -338,7 +325,6 @@ def find_element_with_retry(self, by, value, retries=3, delay=2): raise NoSuchElementException(f"Element not found: {by}, {value}") def get_response_for_label(self, label_text): - """Get user response for a given label text.""" current_location = self.locations[self.current_location_index] if current_location in self.context_data["user_inputs"]: location_specific_inputs = self.context_data["user_inputs"][current_location] @@ -353,7 +339,6 @@ def get_response_for_label(self, label_text): return user_input def get_radio_response_for_label(self, label_text, options): - """Get user response for a radio button group labeled by the given text.""" current_location = self.locations[self.current_location_index] if current_location in self.context_data["user_inputs"]: location_specific_inputs = self.context_data["user_inputs"][current_location] @@ -376,7 +361,6 @@ def get_radio_response_for_label(self, label_text, options): print("Invalid input, please try again.") def get_file_response_for_label(self, label_text): - """Get user response for a file upload labeled by the given text.""" current_location = self.locations[self.current_location_index] if current_location in self.context_data["user_inputs"]: location_specific_inputs = self.context_data["user_inputs"][current_location] @@ -391,15 +375,19 @@ def get_file_response_for_label(self, label_text): return user_input def update_config_file(self): - """Update the configuration file with the latest user inputs.""" with open("config.json", "w") as config_file: json.dump(self.context_data, config_file, indent=4) def find_offers(self): - """Find and apply to job offers.""" + if self.collection: + self.apply_collection() + else: + self.apply_filtered_jobs() + + def apply_filtered_jobs(self): while self.current_location_index < len(self.locations): self.apply_filters_and_search() - + current_page = 1 while True: @@ -420,13 +408,10 @@ def find_offers(self): break job_item = job_list_items[index] - - # Scroll the element into view self.driver.execute_script("arguments[0].scrollIntoView(true);", job_item) time.sleep(1) - + try: - # Attempt to click the element with JavaScript self.driver.execute_script("arguments[0].click();", job_item) except ElementClickInterceptedException: self.log_info("Element click intercepted, skipping to next job...") @@ -441,7 +426,7 @@ def find_offers(self): ) company_name = self.get_company_name(job_item) - + if company_name in self.applied_companies: self.log_info(f"Already applied to a job at {company_name}, skipping...") self.close_application_modal() @@ -497,8 +482,108 @@ def find_offers(self): self.current_location_index += 1 + def apply_collection(self): + collection_url = self.COLLECTION_URLS.get(self.collection) + if not collection_url: + self.log_error(f"Invalid collection: {self.collection}") + return + + self.driver.get(collection_url) + time.sleep(5) + + current_page = 1 + + while True: + try: + WebDriverWait(self.driver, 10).until( + EC.presence_of_element_located((By.CLASS_NAME, "scaffold-layout__list-container")) + ) + + job_list_container = self.find_element_with_retry(By.CLASS_NAME, "scaffold-layout__list-container") + job_list_items = job_list_container.find_elements(By.TAG_NAME, "li") + + for index in range(len(job_list_items)): + try: + job_list_container = self.find_element_with_retry(By.CLASS_NAME, "scaffold-layout__list-container") + job_list_items = job_list_container.find_elements(By.TAG_NAME, "li") + + if index >= len(job_list_items): + break + + job_item = job_list_items[index] + self.driver.execute_script("arguments[0].scrollIntoView(true);", job_item) + time.sleep(1) + + try: + self.driver.execute_script("arguments[0].click();", job_item) + except ElementClickInterceptedException: + self.log_info("Element click intercepted, skipping to next job...") + continue + + time.sleep(2) + + WebDriverWait(self.driver, 10).until( + EC.presence_of_element_located( + (By.CLASS_NAME, "jobs-search__job-details--wrapper") + ) + ) + + company_name = self.get_company_name(job_item) + + if company_name in self.applied_companies: + self.log_info(f"Already applied to a job at {company_name}, skipping...") + self.close_application_modal() + continue + + job_details_wrapper = self.find_element_with_retry(By.CLASS_NAME, "jobs-search__job-details--wrapper") + + try: + apply_button = job_details_wrapper.find_element( + By.CSS_SELECTOR, "button.jobs-apply-button.artdeco-button--primary" + ) + apply_button.click() + time.sleep(2) + + WebDriverWait(self.driver, 10).until( + EC.presence_of_element_located( + (By.CSS_SELECTOR, "div.jobs-easy-apply-modal") + ) + ) + + try: + self.handle_easy_apply() + self.log_applied_company(company_name) + except Exception as e: + self.log_info(f"Failed to apply at {company_name}: {str(e)}") + self.log_failed_application(company_name) + + except NoSuchElementException: + self.log_info("No apply button found, continuing to next job...") + continue + + except (NoSuchElementException, ElementNotInteractableException, StaleElementReferenceException) as e: + self.log_info(f"Exception occurred: {e}, continuing to next job...") + self.log_error(f"Find offers error: {e}") + continue + + try: + pagination_container = self.find_element_with_retry(By.CLASS_NAME, "artdeco-pagination__pages") + next_page_button = pagination_container.find_element( + By.XPATH, + f"//button[@aria-label='Page {current_page + 1}']", + ) + self.driver.execute_script("arguments[0].click();", next_page_button) + time.sleep(2) + current_page += 1 + except NoSuchElementException: + self.log_info("No more pages left.") + break + except TimeoutException: + self.log_info("Timeout while waiting for job list container.") + self.log_error("Timeout while waiting for job list container.") + break + def get_company_name(self, job_item): - """Extract the company name from a job listing.""" try: company_element = job_item.find_element( By.CSS_SELECTOR, @@ -509,7 +594,6 @@ def get_company_name(self, job_item): return None def handle_easy_apply(self): - """Handle the easy apply process.""" while True: try: modal_dialog = WebDriverWait(self.driver, 10).until( @@ -555,7 +639,6 @@ def handle_easy_apply(self): break def fill_form(self, modal_dialog): - """Fill out the application form.""" form_elements = modal_dialog.find_elements( By.CSS_SELECTOR, "div[data-test-form-element], fieldset[data-test-form-builder-radio-button-form-component], fieldset[data-test-checkbox-form-component], div[data-test-text-entity-list-form-component]" ) @@ -569,7 +652,7 @@ def fill_form(self, modal_dialog): elif "data-test-text-entity-list-form-component" in element.get_attribute("outerHTML"): select_element = element.find_element(By.CSS_SELECTOR, "select") options = [option.text for option in select_element.find_elements(By.TAG_NAME, "option")] - response = self.get_radio_response_for_label(label_text, options[1:]) # Exclude "Select an option" + response = self.get_radio_response_for_label(label_text, options[1:]) for option in select_element.find_elements(By.TAG_NAME, "option"): if option.text == response: option.click() @@ -626,7 +709,6 @@ def fill_form(self, modal_dialog): self.log_info("Next button not found, form might be complete or there is an issue.") def handle_checkboxes(self, element): - """Handle multiple checkbox inputs.""" checkboxes = element.find_elements(By.CSS_SELECTOR, "input[type='checkbox']") for index in range(len(checkboxes)): checkbox_label = None @@ -641,7 +723,6 @@ def handle_checkboxes(self, element): self.retry_checkbox_interaction(element, index) def retry_checkbox_interaction(self, element, index): - """Retry interaction with the checkbox in case of exceptions.""" retries = 3 while retries > 0: retries -= 1 @@ -659,14 +740,12 @@ def retry_checkbox_interaction(self, element, index): self.log_info(f"Skipping {checkbox_label} after multiple retries.") def set_checkbox_state(self, checkbox, checkbox_label, response): - """Set the state of a checkbox.""" if response and not checkbox.is_selected(): self.driver.execute_script("arguments[0].click();", checkbox) elif not response and checkbox.is_selected(): self.driver.execute_script("arguments[0].click();", checkbox) def get_checkbox_response_for_label(self, label_text): - """Get user response for a checkbox labeled by the given text.""" current_location = self.locations[self.current_location_index] if current_location not in self.context_data["user_inputs"]: self.context_data["user_inputs"][current_location] = {} @@ -684,7 +763,6 @@ def get_checkbox_response_for_label(self, label_text): return response def handle_done_button(self): - """Handle the final done button after application submission.""" try: done_button = WebDriverWait(self.driver, 10).until( EC.presence_of_element_located((By.CSS_SELECTOR, "button.artdeco-button.artdeco-button--primary")) @@ -695,7 +773,6 @@ def handle_done_button(self): self.log_info("Done button not found, skipping to next job.") def close_application_modal(self): - """Close the application modal.""" try: close_button = WebDriverWait(self.driver, 10).until( EC.presence_of_element_located( @@ -712,7 +789,6 @@ def close_application_modal(self): self.log_info("Close button not found, skipping to next job.") def handle_discard_dialog(self): - """Handle the discard dialog when closing the application modal.""" try: discard_button = WebDriverWait(self.driver, 10).until( EC.presence_of_element_located( @@ -725,16 +801,13 @@ def handle_discard_dialog(self): self.log_info("Discard button not found, skipping to next job.") def close_session(self): - """Close the browser session.""" self.log_info("End of the session") self.driver.close() self.driver.quit() def handle_captcha(self): - """Handle CAPTCHA prompts manually.""" input("CAPTCHA detected. Please solve the CAPTCHA manually and then press Enter to continue...") - if __name__ == "__main__": with open("config.json") as config_file: data = json.load(config_file)