library(XML)
library(rvest)
## Warning: package 'rvest' was built under R version 3.4.2
## Loading required package: xml2
## Warning: package 'xml2' was built under R version 3.4.2
##
## Attaching package: 'rvest'
## The following object is masked from 'package:XML':
##
## xml
library(stringr)
Deloitte - Data Scientist Engineer
Cyber1 <- read_html("https://jobs2.deloitte.com/us/en/job/DELOA004X152711/Cyber-Data-Scientist-Engineer?src=JB-16801")
Cyber1
## {xml_document}
## <html lang="en">
## [1] <head>\n<meta charset="UTF-8">\n<meta http-equiv="X-UA-Compatible" c ...
## [2] <body class="jobDetails cookie us en null">\n<header class="navbar ...
Cyber1_Skills <- html_nodes(Cyber1, "ul:nth-child(19), ul:nth-child(16)")
Cyber1_Skills
## {xml_nodeset (2)}
## [1] <ul>\n<li><div><font size="2" face="Verdana">Bachelor<U+0092>s Degree in co ...
## [2] <ul>\n<li><div><font color="black" size="2" face="Verdana">Previous ...
Cyber1_skills1 <- html_text(Cyber1_Skills)
Cyber1_skills1
## [1] "Bachelor<U+0092>s Degree in computer science, mathematics, or statistics, or related field2+ years of relevant consulting or industry experienceProven experience effectively prioritizing workload to meet deadlines and work objectivesDemonstrated ability to write clearly, succinctly, and in a manner that appeals to a wide audienceProficiency in word processing, spreadsheet, and presentation creation tools, as well as Internet research toolsAbility to obtain and maintain the required clearance for this roleAt least a Secret ClearanceSQL Python Amazon Web Services (AWS) Business Intelligence Reporting Agile Software Development Methodology Advanced Statistical Analysis & Modeling"
## [2] "Previous Federal Consulting experienceUnderstanding of fundamental cloud computing conceptsExperience with Information Assurance concepts and processes within the Federal governmentKnowledge of and experience with Federal security regulations, standards, and processes including FISMA, FIPS, NIST, and FedRAMPApache KafkaNetflow aggregators, e.g. StealthWatchLog aggregation systems, e.g. Splunk, ELKNetwork monitoring systems, e.g. Bro, SuricataPacket processingExperience with at least one of the following:DockerApache JenaApache Mesos"
Since the words are connected, I didn’t know how to seperate them without using specific spacing, so I took the individual requirements.
Deloitte1 <- str_extract(Cyber1_skills1[1], fixed("Bachelor's Degree in computer science, mathematics, or statistics, or related field", ignore_case = TRUE))
Deloitte2 <- str_extract(Cyber1_skills1[1], fixed("2+ years of relevant consulting or industry experience", ignore_case = TRUE))
Deloitte3 <- str_extract(Cyber1_skills1[1], fixed("Proven experience effectively prioritizing workload to meet deadlines and work objectives", ignore_case = TRUE))
Deloitte4 <- str_extract(Cyber1_skills1[1], fixed("Demonstrated ability to write clearly, succinctly, and in a manner that appeals to a wide audience", ignore_case = TRUE))
Deloitte5 <- str_extract(Cyber1_skills1[1], fixed("Proficiency in word processing, spreadsheet, and presentation creation tools, as well as Internet research tools", ignore_case = TRUE))
Deloitte6 <- str_extract(Cyber1_skills1[1], fixed("Ability to obtain and maintain the required clearance for this role", ignore_case = TRUE))
Deloitte7 <- str_extract(Cyber1_skills1[1], fixed("At least a Secret Clearance", ignore_case = TRUE))
Deloitte8 <- str_extract(Cyber1_skills1[1], fixed("SQL", ignore_case = TRUE))
Deloitte9 <- str_extract(Cyber1_skills1[1], fixed("Python Amazon Web Services", ignore_case = TRUE))
Deloitte10 <- str_extract(Cyber1_skills1[1], fixed("Business Intelligence Reporting", ignore_case = TRUE))
Deloitte11 <- str_extract(Cyber1_skills1[1], fixed("Agile Software Development Methodology", ignore_case = TRUE))
Deloitte12 <- str_extract(Cyber1_skills1[1], fixed("Advanced Statistical Analysis & Modeling", ignore_case = TRUE))
cyber1_skills1_Required <- c(Deloitte1,Deloitte2,Deloitte3,Deloitte4,Deloitte5,Deloitte6,Deloitte7,Deloitte8,Deloitte9,Deloitte10,Deloitte11,Deloitte12)
cyber1_skills1_Required
## [1] NA
## [2] "2+ years of relevant consulting or industry experience"
## [3] "Proven experience effectively prioritizing workload to meet deadlines and work objectives"
## [4] "Demonstrated ability to write clearly, succinctly, and in a manner that appeals to a wide audience"
## [5] "Proficiency in word processing, spreadsheet, and presentation creation tools, as well as Internet research tools"
## [6] "Ability to obtain and maintain the required clearance for this role"
## [7] "At least a Secret Clearance"
## [8] "SQL"
## [9] "Python Amazon Web Services"
## [10] "Business Intelligence Reporting"
## [11] "Agile Software Development Methodology"
## [12] "Advanced Statistical Analysis & Modeling"
Deloitte.1 <- str_extract(Cyber1_skills1[2], fixed("Previous Federal Consulting experience", ignore_case = TRUE))
Deloitte.2 <- str_extract(Cyber1_skills1[2], fixed("Understanding of fundamental cloud computing concepts", ignore_case = TRUE))
Deloitte.3 <- str_extract(Cyber1_skills1[2], fixed("Experience with Information Assurance concepts and processes within the Federal governmen", ignore_case = TRUE))
Deloitte.4 <- str_extract(Cyber1_skills1[2], fixed("Knowledge of and experience with Federal security regulations, standards, and processes including FISMA, FIPS, NIST, and FedRAMP", ignore_case = TRUE))
Deloitte.5 <- str_extract(Cyber1_skills1[2], fixed("Apache Kafka", ignore_case = TRUE))
Deloitte.6 <- str_extract(Cyber1_skills1[2], fixed("Netflow aggregators, e.g. StealthWatch", ignore_case = TRUE))
Deloitte.7 <- str_extract(Cyber1_skills1[2], fixed("Log aggregation systems, e.g. Splunk, ELK", ignore_case = TRUE))
Deloitte.8 <- str_extract(Cyber1_skills1[2], fixed("Network monitoring systems, e.g. Bro, Suricata", ignore_case = TRUE))
Deloitte.9 <- str_extract(Cyber1_skills1[2], fixed("Packet processing", ignore_case = TRUE))
Deloitte.10 <- str_extract(Cyber1_skills1[2], fixed("Docker", ignore_case = TRUE))
Deloitte.11 <- str_extract(Cyber1_skills1[2], fixed("Apache Jena", ignore_case = TRUE))
Deloitte.12 <- str_extract(Cyber1_skills1[2], fixed("Apache Mesos", ignore_case = TRUE))
cyber1_skills1_Preferred <- c(Deloitte.1,Deloitte.2,Deloitte.3,Deloitte.4,Deloitte.5,Deloitte.6,Deloitte.7,Deloitte.8,Deloitte.9,Deloitte.10,Deloitte.11,Deloitte.12)
cyber1_skills1_Preferred
## [1] "Previous Federal Consulting experience"
## [2] "Understanding of fundamental cloud computing concepts"
## [3] "Experience with Information Assurance concepts and processes within the Federal governmen"
## [4] "Knowledge of and experience with Federal security regulations, standards, and processes including FISMA, FIPS, NIST, and FedRAMP"
## [5] "Apache Kafka"
## [6] "Netflow aggregators, e.g. StealthWatch"
## [7] "Log aggregation systems, e.g. Splunk, ELK"
## [8] "Network monitoring systems, e.g. Bro, Suricata"
## [9] "Packet processing"
## [10] "Docker"
## [11] "Apache Jena"
## [12] "Apache Mesos"
Cyber1_skills1_all <- list(c(cyber1_skills1_Required,cyber1_skills1_Preferred))
Cyber1_skills1_all
## [[1]]
## [1] NA
## [2] "2+ years of relevant consulting or industry experience"
## [3] "Proven experience effectively prioritizing workload to meet deadlines and work objectives"
## [4] "Demonstrated ability to write clearly, succinctly, and in a manner that appeals to a wide audience"
## [5] "Proficiency in word processing, spreadsheet, and presentation creation tools, as well as Internet research tools"
## [6] "Ability to obtain and maintain the required clearance for this role"
## [7] "At least a Secret Clearance"
## [8] "SQL"
## [9] "Python Amazon Web Services"
## [10] "Business Intelligence Reporting"
## [11] "Agile Software Development Methodology"
## [12] "Advanced Statistical Analysis & Modeling"
## [13] "Previous Federal Consulting experience"
## [14] "Understanding of fundamental cloud computing concepts"
## [15] "Experience with Information Assurance concepts and processes within the Federal governmen"
## [16] "Knowledge of and experience with Federal security regulations, standards, and processes including FISMA, FIPS, NIST, and FedRAMP"
## [17] "Apache Kafka"
## [18] "Netflow aggregators, e.g. StealthWatch"
## [19] "Log aggregation systems, e.g. Splunk, ELK"
## [20] "Network monitoring systems, e.g. Bro, Suricata"
## [21] "Packet processing"
## [22] "Docker"
## [23] "Apache Jena"
## [24] "Apache Mesos"
Next Gen Cyber - Data Scientist
Cyber2 <- read_html("https://www.nextgencybercareers.com/job/183/data-scientist/")
Cyber2
## {xml_document}
## <html lang="en">
## [1] <head>\n<meta http-equiv="Content-Type" content="text/html; charset= ...
## [2] <body>\n <nav class="navbar navbar-default"><div class="container ...
Cyber2_Skills <- html_nodes(Cyber2, "ul:nth-child(10) , ul:nth-child(8)")
Cyber2_Skills
## {xml_nodeset (2)}
## [1] <ul>\n<li>BS, MS, or PhD in Computer Science, Engineering or related ...
## [2] <ul>\n<li>Experience with applied machine learning or algorithm deve ...
Cyber2_Skills2 <- html_text(Cyber2_Skills)
Cyber2_Skills2
## [1] "BS, MS, or PhD in Computer Science, Engineering or related field\n2+ years experience with Python, Scala, or Java and distributed frameworks (Hadoop, Spark, etc.)\nExperience with<U+0085>\nRapid prototyping and advanced analytics (e.g. R, MatLab, Pandas, SciPy)\nSQL and Relational Databases\nPossess a strong blend of technology and analytical skill\nDemonstrable successes in delivering analytical projects, including structuring and conducting analyses to generate business insights and recommendations\nSolution/Delivery-oriented team player willing to go above and beyond\nAbility to work beyond familiar algorithms - to get out of one<U+0092>s comfort zone and earnestly seek to integrate the best solutions to business challenges\nHigh motivation, work ethic, and self-discipline to organize and complete tasks\nSincere interest in working at a startup and scaling with the company as we grow\n"
## [2] "Experience with applied machine learning or algorithm development\nExperience or interest in the life sciences industry\nTrack record of delivering analytical solutions to poorly scoped problems\nPrior client-side analytical experience serving Marketing, Sales, Medical Affairs, or Clinical Development, or, vendor-side analytical experience working with Life Sciences clients\nExperience working with proprietary secondary data including medical / pharmacy claims, prescription data, sales data, and longitudinal patient-level data\n"
This one is seperated by “”, so it was easier to split.
NextCyber_Required <- str_split(Cyber2_Skills2[1],pattern = "\n")
NextCyber_Required
## [[1]]
## [1] "BS, MS, or PhD in Computer Science, Engineering or related field"
## [2] "2+ years experience with Python, Scala, or Java and distributed frameworks (Hadoop, Spark, etc.)"
## [3] "Experience with<U+0085>"
## [4] "Rapid prototyping and advanced analytics (e.g. R, MatLab, Pandas, SciPy)"
## [5] "SQL and Relational Databases"
## [6] "Possess a strong blend of technology and analytical skill"
## [7] "Demonstrable successes in delivering analytical projects, including structuring and conducting analyses to generate business insights and recommendations"
## [8] "Solution/Delivery-oriented team player willing to go above and beyond"
## [9] "Ability to work beyond familiar algorithms - to get out of one<U+0092>s comfort zone and earnestly seek to integrate the best solutions to business challenges"
## [10] "High motivation, work ethic, and self-discipline to organize and complete tasks"
## [11] "Sincere interest in working at a startup and scaling with the company as we grow"
## [12] ""
NextCyber_Preferred <- str_split(Cyber2_Skills2[2],pattern = "\n")
NextCyber_Preferred
## [[1]]
## [1] "Experience with applied machine learning or algorithm development"
## [2] "Experience or interest in the life sciences industry"
## [3] "Track record of delivering analytical solutions to poorly scoped problems"
## [4] "Prior client-side analytical experience serving Marketing, Sales, Medical Affairs, or Clinical Development, or, vendor-side analytical experience working with Life Sciences clients"
## [5] "Experience working with proprietary secondary data including medical / pharmacy claims, prescription data, sales data, and longitudinal patient-level data"
## [6] ""
Cyber2_skills2_all <- list(c(NextCyber_Required,NextCyber_Preferred))
Cyber2_skills2_all
## [[1]]
## [[1]][[1]]
## [1] "BS, MS, or PhD in Computer Science, Engineering or related field"
## [2] "2+ years experience with Python, Scala, or Java and distributed frameworks (Hadoop, Spark, etc.)"
## [3] "Experience with<U+0085>"
## [4] "Rapid prototyping and advanced analytics (e.g. R, MatLab, Pandas, SciPy)"
## [5] "SQL and Relational Databases"
## [6] "Possess a strong blend of technology and analytical skill"
## [7] "Demonstrable successes in delivering analytical projects, including structuring and conducting analyses to generate business insights and recommendations"
## [8] "Solution/Delivery-oriented team player willing to go above and beyond"
## [9] "Ability to work beyond familiar algorithms - to get out of one<U+0092>s comfort zone and earnestly seek to integrate the best solutions to business challenges"
## [10] "High motivation, work ethic, and self-discipline to organize and complete tasks"
## [11] "Sincere interest in working at a startup and scaling with the company as we grow"
## [12] ""
##
## [[1]][[2]]
## [1] "Experience with applied machine learning or algorithm development"
## [2] "Experience or interest in the life sciences industry"
## [3] "Track record of delivering analytical solutions to poorly scoped problems"
## [4] "Prior client-side analytical experience serving Marketing, Sales, Medical Affairs, or Clinical Development, or, vendor-side analytical experience working with Life Sciences clients"
## [5] "Experience working with proprietary secondary data including medical / pharmacy claims, prescription data, sales data, and longitudinal patient-level data"
## [6] ""
Security Score Card Inc. - Senior Data Scientist
Cyber3 <- read_html("https://www.glassdoor.com/job-listing/senior-data-scientist-securityscorecard-JV_IC1132348_KO0,21_KE22,39.htm?jl=1978832215")
Cyber3
## {xml_document}
## <html lang="en" xmlns:fb="http://www.facebook.com/2008/fbml" xmlns:og="http://opengraph.org/schema/" class="flex">
## [1] <head>\n<meta http-equiv="Content-Type" content="text/html; charset= ...
## [2] <body class="main flex loggedOut lang-en en-US hollywood " marginwid ...
Cyber3_Skills <- html_nodes(Cyber3,"p:nth-child(3) , #JobDescContainer p:nth-child(2)")
Cyber3_Skills
## {xml_nodeset (2)}
## [1] <p><strong>What you have</strong><br>- Security experience in a comm ...
## [2] <p><strong>Tools you'll use</strong><br>- Python<br>- Open-source nu ...
Cyber3_Skills3 <- html_text(Cyber3_Skills)
Cyber3_Skills3
## [1] "What you have- Security experience in a commercial environment - Experience and love for problems with large data sets, machine learning, visualization, and cyber security - Commercial experience developing predictive models or classifiers- Experience with ETL techniques - Clear, concise, and effective communication skills (written and verbal) - Ability to collaborate with engineers across different teams to understand and solve problems- Understanding of Agile development practices *Bonus: knowledge of NLP concepts "
## [2] "Tools you'll use- Python- Open-source numerical and scientific libraries - Scikit- AWS- Postgres- D3*Nice to have: Scala"
Security_Scorecard_1 <- str_split(Cyber3_Skills3[1],pattern = "- ")
Security_Scorecard_1
## [[1]]
## [1] "What you have"
## [2] "Security experience in a commercial environment "
## [3] "Experience and love for problems with large data sets, machine learning, visualization, and cyber security "
## [4] "Commercial experience developing predictive models or classifiers"
## [5] "Experience with ETL techniques "
## [6] "Clear, concise, and effective communication skills (written and verbal) "
## [7] "Ability to collaborate with engineers across different teams to understand and solve problems"
## [8] "Understanding of Agile development practices *Bonus: knowledge of NLP concepts "
Security_Scorecard_2 <- str_split(Cyber3_Skills3[2],pattern = "- ")
Security_Scorecard_2
## [[1]]
## [1] "Tools you'll use"
## [2] "Python"
## [3] "Open-source numerical and scientific libraries "
## [4] "Scikit"
## [5] "AWS"
## [6] "Postgres"
## [7] "D3*Nice to have: Scala"
Cyber3_skills3_all<- list(c(Security_Scorecard_1,Security_Scorecard_2))
Cyber3_skills3_all
## [[1]]
## [[1]][[1]]
## [1] "What you have"
## [2] "Security experience in a commercial environment "
## [3] "Experience and love for problems with large data sets, machine learning, visualization, and cyber security "
## [4] "Commercial experience developing predictive models or classifiers"
## [5] "Experience with ETL techniques "
## [6] "Clear, concise, and effective communication skills (written and verbal) "
## [7] "Ability to collaborate with engineers across different teams to understand and solve problems"
## [8] "Understanding of Agile development practices *Bonus: knowledge of NLP concepts "
##
## [[1]][[2]]
## [1] "Tools you'll use"
## [2] "Python"
## [3] "Open-source numerical and scientific libraries "
## [4] "Scikit"
## [5] "AWS"
## [6] "Postgres"
## [7] "D3*Nice to have: Scala"
Novetta - Cyber Security Data Scientist
Cyber4 <- read_html("https://career4.successfactors.com/career?career_ns=job_listing&company=novetta&navBarLevel=JOB_SEARCH&rcm_site_locale=en_US&career_job_req_id=22561&selected_lang=en_US&jobAlertController_jobAlertId=&jobAlertController_jobAlertName=&_s.crb=n17kqKsnxhTfHbEykMzNLGiVOjw=&jobPipeline=Indeed")
Cyber4
## {xml_document}
## <html lang="en">
## [1] <head>\n<meta http-equiv="Content-Type" content="text/html; charset= ...
## [2] <body class="" onload="">\n\n\n<script type="text/javascript"> windo ...
Cyber4_Skills <- html_nodes(Cyber4, "p:nth-child(23) , p:nth-child(24) , p:nth-child(25) , p:nth-child(19) , p:nth-child(20) , p:nth-child(18) , p:nth-child(17) , p:nth-child(16) , p:nth-child(15)")
Cyber4_Skills
## {xml_nodeset (9)}
## [1] <p>BS in Data Analytics, Applied Mathematics, Statistics, Econometri ...
## [2] <p>1+ year of experience in data analytics, data science, data minin ...
## [3] <p>Proven hands-on experience with Python, Ruby, R, or another data ...
## [4] <p>Proven experience developing ETL processes, developing data model ...
## [5] <p>Interest in or knowledge of cyber threat landscape to include com ...
## [6] <p>Interest in or knowledge of global political and security issues</p>
## [7] <p>MS in Applied Mathematics, Statistics, Econometrics, Operations R ...
## [8] <p>Strong background in Python, Ruby, R, and/or other development fo ...
## [9] <p>Familiarity or experience with IBM SPSS Modeler </p>
Cyber4_Skills4_all <- html_text(Cyber4_Skills)
Cyber4_Skills4_all
## [1] "BS in Data Analytics, Applied Mathematics, Statistics, Econometrics, Operations Research, Computer Engineering, Computer Science, Electrical Engineering, Information Technology or related field"
## [2] "1+ year of experience in data analytics, data science, data mining, or closely related field"
## [3] "Proven hands-on experience with Python, Ruby, R, or another data processing programming language"
## [4] "Proven experience developing ETL processes, developing data models, and analyzing multi-source data"
## [5] "Interest in or knowledge of cyber threat landscape to include common tactics, techniques, and procedures"
## [6] "Interest in or knowledge of global political and security issues"
## [7] "MS in Applied Mathematics, Statistics, Econometrics, Operations Research, Computer Engineering, Computer Science, Electrical Engineering, Information Technology or related field plus two years of work experience"
## [8] "Strong background in Python, Ruby, R, and/or other development for data analysis"
## [9] "Familiarity or experience with IBM SPSS Modeler "
CIA - Data Scientist
Cyber5 <- read_html("https://www.cia.gov/careers/opportunities/science-technology/data-scientist.html")
Cyber5
## {xml_document}
## <html xmlns="http://www.w3.org/1999/xhtml" class="no-js" lang="en" xml:lang="en">
## [1] <head>\n<meta http-equiv="Content-Type" content="text/html; charset= ...
## [2] <body class="template-document_view_job portaltype-agencyjob site-CI ...
Cyber5_Skills <- html_nodes(Cyber5,"ul:nth-child(17) li , ul:nth-child(15) li")
Cyber5_Skills
## {xml_nodeset (8)}
## [1] <li>Master's degree in a data science equivalent field or sub-field< ...
## [2] <li>Experience working with data rich problems through research or p ...
## [3] <li>Experience with computer programming</li>
## [4] <li>Ability to successfully complete projects with large or incomple ...
## [5] <li><b>Your resume. <br></b></li>
## [6] <li><b>A cover letter in which you specify your qualifications for o ...
## [7] <li><b>Unofficial transcripts for all degrees.</b></li>
## [8] <li><b>A writing sample, five (5) pages MAXIMUM, single spaced, tech ...
Cyber5_Skills5_all <- html_text(Cyber5_Skills)
Cyber5_Skills5_all
## [1] "Master's degree in a data science equivalent field or sub-field"
## [2] "Experience working with data rich problems through research or programs"
## [3] "Experience with computer programming"
## [4] "Ability to successfully complete projects with large or incomplete data sets and provide solutions"
## [5] "Your resume. "
## [6] "A cover letter in which you specify your qualifications for one or more positions."
## [7] "Unofficial transcripts for all degrees."
## [8] "A writing sample, five (5) pages MAXIMUM, single spaced, technical or analytic paper that focuses on your current area of expertise or interest and is related to your interest in positions at CIA. You can excerpt longer papers."
Battelle - Cyber Computer Scientist
Cyber6 <- read_html("http://jobs.battelle.org/ShowJob/Id/1358503/Cyber%20Computer%20Scientist%20Early%20Career")
Cyber6
## {xml_document}
## <html lang="en" class="no-js">
## [1] <head>\n<meta http-equiv="Content-Type" content="text/html; charset= ...
## [2] <body class="template debug">\r\n<!-- Google Tag Manager (noscript) ...
Cyber6_Skills <- html_nodes(Cyber6,"ul:nth-child(25) , ul:nth-child(22)")
Cyber6_Skills
## {xml_nodeset (2)}
## [1] <ul>\n<li>Bachelor<U+0092>s degree in Computer Science, Computer Engineerin ...
## [2] <ul>\n<li>Ability to apply learned cyber skills to real life scenari ...
Cyber6_Skills6 <- html_text(Cyber6_Skills)
Cyber6_Skills6
## [1] "Bachelor<U+0092>s degree in Computer Science, Computer Engineering, or related field of study, or equivalent experience\n\t0-2 years<U+0092> experience in Computer Science, Computer Engineering, or related technical area\n\tAbility to code in C, C++, or C#\n\tDevelop Software to run in either user-mode or kernel-mode\n\tAutomate tasks using a scripting language (Python, Perl, Ruby, etc.)\n\tUnderstand network protocols\n\tAbility to demonstrate good organization, communication, problem-solving and teamwork skills\n\tMust be a sole US citizen with the ability to obtain and maintain a US government security clearance\n"
## [2] "Ability to apply learned cyber skills to real life scenarios (internships, hack-a-thons, cyber security clubs, CTFs, etc.)\n\tAbility to develop protocols for all layers throughout the network stack\n\tBackground in software engineering and architecture\n\tExperience with network architecture and security mechanisms\n\tKnowledge of cryptographic algorithms (AES, RSA, etc.)\n\tPrevious exposure to malware reverse engineering\n\tActive Secret or Top Secret clearance\n"
Cyber6_Skills6_All <- str_split(Cyber6_Skills6, pattern = "\n\t")
Cyber6_Skills6_All
## [[1]]
## [1] "Bachelor<U+0092>s degree in Computer Science, Computer Engineering, or related field of study, or equivalent experience"
## [2] "0-2 years<U+0092> experience in Computer Science, Computer Engineering, or related technical area"
## [3] "Ability to code in C, C++, or C#"
## [4] "Develop Software to run in either user-mode or kernel-mode"
## [5] "Automate tasks using a scripting language (Python, Perl, Ruby, etc.)"
## [6] "Understand network protocols"
## [7] "Ability to demonstrate good organization, communication, problem-solving and teamwork skills"
## [8] "Must be a sole US citizen with the ability to obtain and maintain a US government security clearance\n"
##
## [[2]]
## [1] "Ability to apply learned cyber skills to real life scenarios (internships, hack-a-thons, cyber security clubs, CTFs, etc.)"
## [2] "Ability to develop protocols for all layers throughout the network stack"
## [3] "Background in software engineering and architecture"
## [4] "Experience with network architecture and security mechanisms"
## [5] "Knowledge of cryptographic algorithms (AES, RSA, etc.)"
## [6] "Previous exposure to malware reverse engineering"
## [7] "Active Secret or Top Secret clearance\n"
Amazon - Data Scientist/Security Architect
Cyber7 <- read_html("https://www.amazon.jobs/en/jobs/575969/data-scientist-security-architect")
Cyber7
## {xml_document}
## <html prefix="og: http://ogp.me/ns#">
## [1] <head>\n<meta http-equiv="Content-Type" content="text/html; charset= ...
## [2] <body>\n<div class="sb-slidebar" off-canvas="navbar-slider right ove ...
## [3] <script>$(document).ready(function() {\n CXT.SLIDEBARS_INITIALIZER. ...
Cyber7_Skills <- html_nodes(Cyber7, "#job-detail .section+ .section p")
Cyber7_Skills
## {xml_nodeset (2)}
## [1] <p><br>Education and experience:<br>·Either<U+0085> Phd/MTech/MS or equival ...
## [2] <p><br>· Track record of diving into data to discover hidden pattern ...
Cyber7_Skills7 <- html_text(Cyber7_Skills)
Cyber7_Skills7
## [1] "Education and experience:·Either<U+0085> Phd/MTech/MS or equivalent degree in Computer Science or Mathematics or Statistics with 3-5 years experience in predictive modeling, data science and analysisOR·Bachelor or Masters Degree in a highly quantitative field (Computer Science, Machine Learning, Operational Research, Statistics, Mathematics, etc.) 5+ years experience in predictive modeling, data science and analysis· Experience using Python and/or R· Experience using SparkML and other ML libraries such as scikit-learn, caret, mlr, MLlib· Experience manipulating and transforming large datasets· Hands-on comfort with a subset of SQL, Hadoop ecosystem (Hive, Spark, etc.), NoSQL, Key/Value stores, document stores· Experience in supporting internal and external customers. You understand what it means to draw out critical customer needs and focus your knowledge and creativity to deliver practical outcomes addressing those needs.In addition, you should have familiarity with information security and/or cloud services and be excited about developing these skills further:Information Security:· Commercial security solutions such as web application firewalls, IDS/IPS, SIEM, DLP, DDOS mitigation· Experience automating IT & security tasks· Building security reference architecture for cloud deployments and hybrid scenarios· Implementation experience with enterprise security solutions such as WAF, IPS, Anti-DDOS, and SIEMCloud Services:· Experience handling terabyte size datasets"
## [2] "· Track record of diving into data to discover hidden patterns· Strong troubleshooting and problem-solving skills· Effective communication and strong collaboration skillsInformation Security· Understanding of enterprise risk management methods and techniques to drive successful outcomes in a multi-national environment· Understanding architectural implications of meeting industry standards such as PCI DSS, ISO 27001, HIPAA, and NIST/DoD frameworks.Cloud Services· Experience with AWS Services· Working knowledge of cloud computing technologies and workload transition challenges· Familiarity with distributed computational approaches· Experience with scalable, distributed computing frameworks· Familiarity with archive, backup/recovery and business continuity processes in distributed operationsAmazon.com is an Equal Opportunity-Affirmative Action Employer <U+0096> Minority / Female / Disability / Veteran / Gender Identity / Sexual Orientationaws-proserv-na"
Amazon_Qualifications <- str_split(Cyber7_Skills7[1],pattern = "·")
Amazon_Qualifications
## [[1]]
## [1] "Education and experience:"
## [2] "Either<U+0085> Phd/MTech/MS or equivalent degree in Computer Science or Mathematics or Statistics with 3-5 years experience in predictive modeling, data science and analysisOR"
## [3] "Bachelor or Masters Degree in a highly quantitative field (Computer Science, Machine Learning, Operational Research, Statistics, Mathematics, etc.) 5+ years experience in predictive modeling, data science and analysis"
## [4] " Experience using Python and/or R"
## [5] " Experience using SparkML and other ML libraries such as scikit-learn, caret, mlr, MLlib"
## [6] " Experience manipulating and transforming large datasets"
## [7] " Hands-on comfort with a subset of SQL, Hadoop ecosystem (Hive, Spark, etc.), NoSQL, Key/Value stores, document stores"
## [8] " Experience in supporting internal and external customers. You understand what it means to draw out critical customer needs and focus your knowledge and creativity to deliver practical outcomes addressing those needs.In addition, you should have familiarity with information security and/or cloud services and be excited about developing these skills further:Information Security:"
## [9] " Commercial security solutions such as web application firewalls, IDS/IPS, SIEM, DLP, DDOS mitigation"
## [10] " Experience automating IT & security tasks"
## [11] " Building security reference architecture for cloud deployments and hybrid scenarios"
## [12] " Implementation experience with enterprise security solutions such as WAF, IPS, Anti-DDOS, and SIEMCloud Services:"
## [13] " Experience handling terabyte size datasets"
Amazon_Preferred <- str_split(Cyber7_Skills7[2],"·")
Amazon_Preferred
## [[1]]
## [1] ""
## [2] " Track record of diving into data to discover hidden patterns"
## [3] " Strong troubleshooting and problem-solving skills"
## [4] " Effective communication and strong collaboration skillsInformation Security"
## [5] " Understanding of enterprise risk management methods and techniques to drive successful outcomes in a multi-national environment"
## [6] " Understanding architectural implications of meeting industry standards such as PCI DSS, ISO 27001, HIPAA, and NIST/DoD frameworks.Cloud Services"
## [7] " Experience with AWS Services"
## [8] " Working knowledge of cloud computing technologies and workload transition challenges"
## [9] " Familiarity with distributed computational approaches"
## [10] " Experience with scalable, distributed computing frameworks"
## [11] " Familiarity with archive, backup/recovery and business continuity processes in distributed operationsAmazon.com is an Equal Opportunity-Affirmative Action Employer <U+0096> Minority / Female / Disability / Veteran / Gender Identity / Sexual Orientationaws-proserv-na"
Cyber7_Skills7_all <- list(c(Amazon_Qualifications,Amazon_Preferred))
Cyber7_Skills7_all
## [[1]]
## [[1]][[1]]
## [1] "Education and experience:"
## [2] "Either<U+0085> Phd/MTech/MS or equivalent degree in Computer Science or Mathematics or Statistics with 3-5 years experience in predictive modeling, data science and analysisOR"
## [3] "Bachelor or Masters Degree in a highly quantitative field (Computer Science, Machine Learning, Operational Research, Statistics, Mathematics, etc.) 5+ years experience in predictive modeling, data science and analysis"
## [4] " Experience using Python and/or R"
## [5] " Experience using SparkML and other ML libraries such as scikit-learn, caret, mlr, MLlib"
## [6] " Experience manipulating and transforming large datasets"
## [7] " Hands-on comfort with a subset of SQL, Hadoop ecosystem (Hive, Spark, etc.), NoSQL, Key/Value stores, document stores"
## [8] " Experience in supporting internal and external customers. You understand what it means to draw out critical customer needs and focus your knowledge and creativity to deliver practical outcomes addressing those needs.In addition, you should have familiarity with information security and/or cloud services and be excited about developing these skills further:Information Security:"
## [9] " Commercial security solutions such as web application firewalls, IDS/IPS, SIEM, DLP, DDOS mitigation"
## [10] " Experience automating IT & security tasks"
## [11] " Building security reference architecture for cloud deployments and hybrid scenarios"
## [12] " Implementation experience with enterprise security solutions such as WAF, IPS, Anti-DDOS, and SIEMCloud Services:"
## [13] " Experience handling terabyte size datasets"
##
## [[1]][[2]]
## [1] ""
## [2] " Track record of diving into data to discover hidden patterns"
## [3] " Strong troubleshooting and problem-solving skills"
## [4] " Effective communication and strong collaboration skillsInformation Security"
## [5] " Understanding of enterprise risk management methods and techniques to drive successful outcomes in a multi-national environment"
## [6] " Understanding architectural implications of meeting industry standards such as PCI DSS, ISO 27001, HIPAA, and NIST/DoD frameworks.Cloud Services"
## [7] " Experience with AWS Services"
## [8] " Working knowledge of cloud computing technologies and workload transition challenges"
## [9] " Familiarity with distributed computational approaches"
## [10] " Experience with scalable, distributed computing frameworks"
## [11] " Familiarity with archive, backup/recovery and business continuity processes in distributed operationsAmazon.com is an Equal Opportunity-Affirmative Action Employer <U+0096> Minority / Female / Disability / Veteran / Gender Identity / Sexual Orientationaws-proserv-na"
Intelletec - Data Scientist Cyber Security
Cyber8<- read_html("https://www.intelletec.com/jobs/senior-data-scientist-cyber-security")
Cyber8
## {xml_document}
## <html lang="en" class="no-js">
## [1] <head>\n<meta http-equiv="Content-Type" content="text/html; charset= ...
## [2] <body>\n <div>\n <div class="connecting-linkedin"><p>Conne ...
Cyber8_Skills <- html_nodes(Cyber8,".col-sm-12.clearfix li:nth-child(3) , #body li:nth-child(7) , #body li:nth-child(6) , .col-sm-12.clearfix li:nth-child(5) , .col-sm-12.clearfix li:nth-child(4) , .col-sm-12.clearfix li:nth-child(2) , .col-sm-12.clearfix li:nth-child(1)")
Cyber8_Skills
## {xml_nodeset (7)}
## [1] <li>Minimum 5 years of Data Science experience</li>
## [2] <li>At least 1 year of leadership experience required </li>
## [3] <li>\n<strong>Machine Learning</strong> and <strong>Cyber Security</ ...
## [4] <li>Experience with <strong>ETL </strong>Pipelines</li>
## [5] <li>\n<strong>NLP</strong> experience</li>
## [6] <li>Experience or familiarity with <strong>Python</strong>, <strong> ...
## [7] <li><strong>Strong Written and Verbal communication a Must</strong>< ...
Cyber8_Skills_all <- html_text(Cyber8_Skills)
Cyber8_Skills_all
## [1] "Minimum 5 years of Data Science experience"
## [2] "At least 1 year of leadership experience required "
## [3] "Machine Learning and Cyber Security experience"
## [4] "Experience with ETL Pipelines"
## [5] "NLP experience"
## [6] "Experience or familiarity with Python, AWS, Scikit, Postgres, D3 and/or Scala"
## [7] "Strong Written and Verbal communication a Must"
JP Morgan Chase - Data Protection Engineer/Cyber Security
Cyber9 <- read_html("https://jobs.jpmorganchase.com/ShowJob/Id/68258/Data-Protection-Engineer-Cyber-Security/")
Cyber9
## {xml_document}
## <html lang="en" class="no-js">
## [1] <head prefix="og: http://ogp.me/ns# fb: http://ogp.me/ns/fb# article ...
## [2] <body id="details">\r\n\r\n\t<header><div id="sticky-anchor"></div>\ ...
Cyber9_Skills <- html_nodes(Cyber9,"li div")
Cyber9_Skills
## {xml_nodeset (14)}
## [1] <div>\n<font size="2" face="Tahoma">7+ years of overall IT engineer ...
## [2] <div><font size="2" face="Tahoma"><u>Data Protection</u> - Data Los ...
## [3] <div><font size="2" face="Tahoma">Extensive experience in a Red Hat ...
## [4] <div><font size="2" face="Tahoma">Extensive experience with network ...
## [5] <div><font size="2" face="Tahoma">Experience with scripting languag ...
## [6] <div><font size="2" face="Tahoma">Experience with large scale netwo ...
## [7] <div><font size="2" face="Tahoma">Ability to support and liaise wit ...
## [8] <div><font size="2" face="Tahoma">Must be able to work collaborativ ...
## [9] <div><font size="2" face="Tahoma">Must possess a high degree of ini ...
## [10] <div><font size="2" face="Tahoma">Ability to communicate security, ...
## [11] <div><font size="2" face="Tahoma">Data Loss Prevention concepts and ...
## [12] <div><font size="2" face="Tahoma">Data encryption concepts and prod ...
## [13] <div><font size="2" face="Tahoma">Data classification concepts and ...
## [14] <div><font size="2" face="Tahoma">Tokenization, data masking, data ...
Cyber9_Skills_all <- html_text(Cyber9_Skills)
Cyber9_Skills_all
## [1] "7+ years of overall IT engineering or architecture experience with a proven background in Cyber Security specific to:"
## [2] "Data Protection - Data Loss Prevention (DLP), Encryption, Cryptography, Tokenization, Access Control, Data Classification, PKI or the supporting of these security solutions."
## [3] "Extensive experience in a Red Hat Environment"
## [4] "Extensive experience with networking protocols and concepts "
## [5] "Experience with scripting languages such as Java, Shell, Python, or PowerShell"
## [6] "Experience with large scale networks including Microsoft Exchange and Active Directory"
## [7] "Ability to support and liaise with business process owners to incorporate data protection products and provisions into their processes."
## [8] "Must be able to work collaboratively with other areas to advocate information security solutions."
## [9] "Must possess a high degree of initiative, motivation, and problem-solving skills."
## [10] "Ability to communicate security, data protection, data loss prevention related concepts to a broad range of technical and non-technical staff, including senior business leaders"
## [11] "Data Loss Prevention concepts and products (such as Symantec DLP, Digital Guardian, RSA or Mcafee DLP, etc<U+0085>)"
## [12] "Data encryption concepts and products (such as Vormetric, Protegrity, Voltage, etc<U+0085>)"
## [13] "Data classification concepts and products (such as Titus, Varonis, etc<U+0085>)"
## [14] "Tokenization, data masking, data dispersion techniques"
All Requirements listed
Cyber_skills_all <-
list(c(Cyber1_skills1_all,Cyber2_skills2_all,Cyber3_skills3_all,Cyber4_Skills4_all,Cyber5_Skills5_all,Cyber6_Skills6_All,Cyber7_Skills7_all,Cyber8_Skills_all,Cyber9_Skills_all))
Cyber_skills_all
## [[1]]
## [[1]][[1]]
## [1] NA
## [2] "2+ years of relevant consulting or industry experience"
## [3] "Proven experience effectively prioritizing workload to meet deadlines and work objectives"
## [4] "Demonstrated ability to write clearly, succinctly, and in a manner that appeals to a wide audience"
## [5] "Proficiency in word processing, spreadsheet, and presentation creation tools, as well as Internet research tools"
## [6] "Ability to obtain and maintain the required clearance for this role"
## [7] "At least a Secret Clearance"
## [8] "SQL"
## [9] "Python Amazon Web Services"
## [10] "Business Intelligence Reporting"
## [11] "Agile Software Development Methodology"
## [12] "Advanced Statistical Analysis & Modeling"
## [13] "Previous Federal Consulting experience"
## [14] "Understanding of fundamental cloud computing concepts"
## [15] "Experience with Information Assurance concepts and processes within the Federal governmen"
## [16] "Knowledge of and experience with Federal security regulations, standards, and processes including FISMA, FIPS, NIST, and FedRAMP"
## [17] "Apache Kafka"
## [18] "Netflow aggregators, e.g. StealthWatch"
## [19] "Log aggregation systems, e.g. Splunk, ELK"
## [20] "Network monitoring systems, e.g. Bro, Suricata"
## [21] "Packet processing"
## [22] "Docker"
## [23] "Apache Jena"
## [24] "Apache Mesos"
##
## [[1]][[2]]
## [[1]][[2]][[1]]
## [1] "BS, MS, or PhD in Computer Science, Engineering or related field"
## [2] "2+ years experience with Python, Scala, or Java and distributed frameworks (Hadoop, Spark, etc.)"
## [3] "Experience with<U+0085>"
## [4] "Rapid prototyping and advanced analytics (e.g. R, MatLab, Pandas, SciPy)"
## [5] "SQL and Relational Databases"
## [6] "Possess a strong blend of technology and analytical skill"
## [7] "Demonstrable successes in delivering analytical projects, including structuring and conducting analyses to generate business insights and recommendations"
## [8] "Solution/Delivery-oriented team player willing to go above and beyond"
## [9] "Ability to work beyond familiar algorithms - to get out of one<U+0092>s comfort zone and earnestly seek to integrate the best solutions to business challenges"
## [10] "High motivation, work ethic, and self-discipline to organize and complete tasks"
## [11] "Sincere interest in working at a startup and scaling with the company as we grow"
## [12] ""
##
## [[1]][[2]][[2]]
## [1] "Experience with applied machine learning or algorithm development"
## [2] "Experience or interest in the life sciences industry"
## [3] "Track record of delivering analytical solutions to poorly scoped problems"
## [4] "Prior client-side analytical experience serving Marketing, Sales, Medical Affairs, or Clinical Development, or, vendor-side analytical experience working with Life Sciences clients"
## [5] "Experience working with proprietary secondary data including medical / pharmacy claims, prescription data, sales data, and longitudinal patient-level data"
## [6] ""
##
##
## [[1]][[3]]
## [[1]][[3]][[1]]
## [1] "What you have"
## [2] "Security experience in a commercial environment "
## [3] "Experience and love for problems with large data sets, machine learning, visualization, and cyber security "
## [4] "Commercial experience developing predictive models or classifiers"
## [5] "Experience with ETL techniques "
## [6] "Clear, concise, and effective communication skills (written and verbal) "
## [7] "Ability to collaborate with engineers across different teams to understand and solve problems"
## [8] "Understanding of Agile development practices *Bonus: knowledge of NLP concepts "
##
## [[1]][[3]][[2]]
## [1] "Tools you'll use"
## [2] "Python"
## [3] "Open-source numerical and scientific libraries "
## [4] "Scikit"
## [5] "AWS"
## [6] "Postgres"
## [7] "D3*Nice to have: Scala"
##
##
## [[1]][[4]]
## [1] "BS in Data Analytics, Applied Mathematics, Statistics, Econometrics, Operations Research, Computer Engineering, Computer Science, Electrical Engineering, Information Technology or related field"
##
## [[1]][[5]]
## [1] "1+ year of experience in data analytics, data science, data mining, or closely related field"
##
## [[1]][[6]]
## [1] "Proven hands-on experience with Python, Ruby, R, or another data processing programming language"
##
## [[1]][[7]]
## [1] "Proven experience developing ETL processes, developing data models, and analyzing multi-source data"
##
## [[1]][[8]]
## [1] "Interest in or knowledge of cyber threat landscape to include common tactics, techniques, and procedures"
##
## [[1]][[9]]
## [1] "Interest in or knowledge of global political and security issues"
##
## [[1]][[10]]
## [1] "MS in Applied Mathematics, Statistics, Econometrics, Operations Research, Computer Engineering, Computer Science, Electrical Engineering, Information Technology or related field plus two years of work experience"
##
## [[1]][[11]]
## [1] "Strong background in Python, Ruby, R, and/or other development for data analysis"
##
## [[1]][[12]]
## [1] "Familiarity or experience with IBM SPSS Modeler "
##
## [[1]][[13]]
## [1] "Master's degree in a data science equivalent field or sub-field"
##
## [[1]][[14]]
## [1] "Experience working with data rich problems through research or programs"
##
## [[1]][[15]]
## [1] "Experience with computer programming"
##
## [[1]][[16]]
## [1] "Ability to successfully complete projects with large or incomplete data sets and provide solutions"
##
## [[1]][[17]]
## [1] "Your resume. "
##
## [[1]][[18]]
## [1] "A cover letter in which you specify your qualifications for one or more positions."
##
## [[1]][[19]]
## [1] "Unofficial transcripts for all degrees."
##
## [[1]][[20]]
## [1] "A writing sample, five (5) pages MAXIMUM, single spaced, technical or analytic paper that focuses on your current area of expertise or interest and is related to your interest in positions at CIA. You can excerpt longer papers."
##
## [[1]][[21]]
## [1] "Bachelor<U+0092>s degree in Computer Science, Computer Engineering, or related field of study, or equivalent experience"
## [2] "0-2 years<U+0092> experience in Computer Science, Computer Engineering, or related technical area"
## [3] "Ability to code in C, C++, or C#"
## [4] "Develop Software to run in either user-mode or kernel-mode"
## [5] "Automate tasks using a scripting language (Python, Perl, Ruby, etc.)"
## [6] "Understand network protocols"
## [7] "Ability to demonstrate good organization, communication, problem-solving and teamwork skills"
## [8] "Must be a sole US citizen with the ability to obtain and maintain a US government security clearance\n"
##
## [[1]][[22]]
## [1] "Ability to apply learned cyber skills to real life scenarios (internships, hack-a-thons, cyber security clubs, CTFs, etc.)"
## [2] "Ability to develop protocols for all layers throughout the network stack"
## [3] "Background in software engineering and architecture"
## [4] "Experience with network architecture and security mechanisms"
## [5] "Knowledge of cryptographic algorithms (AES, RSA, etc.)"
## [6] "Previous exposure to malware reverse engineering"
## [7] "Active Secret or Top Secret clearance\n"
##
## [[1]][[23]]
## [[1]][[23]][[1]]
## [1] "Education and experience:"
## [2] "Either<U+0085> Phd/MTech/MS or equivalent degree in Computer Science or Mathematics or Statistics with 3-5 years experience in predictive modeling, data science and analysisOR"
## [3] "Bachelor or Masters Degree in a highly quantitative field (Computer Science, Machine Learning, Operational Research, Statistics, Mathematics, etc.) 5+ years experience in predictive modeling, data science and analysis"
## [4] " Experience using Python and/or R"
## [5] " Experience using SparkML and other ML libraries such as scikit-learn, caret, mlr, MLlib"
## [6] " Experience manipulating and transforming large datasets"
## [7] " Hands-on comfort with a subset of SQL, Hadoop ecosystem (Hive, Spark, etc.), NoSQL, Key/Value stores, document stores"
## [8] " Experience in supporting internal and external customers. You understand what it means to draw out critical customer needs and focus your knowledge and creativity to deliver practical outcomes addressing those needs.In addition, you should have familiarity with information security and/or cloud services and be excited about developing these skills further:Information Security:"
## [9] " Commercial security solutions such as web application firewalls, IDS/IPS, SIEM, DLP, DDOS mitigation"
## [10] " Experience automating IT & security tasks"
## [11] " Building security reference architecture for cloud deployments and hybrid scenarios"
## [12] " Implementation experience with enterprise security solutions such as WAF, IPS, Anti-DDOS, and SIEMCloud Services:"
## [13] " Experience handling terabyte size datasets"
##
## [[1]][[23]][[2]]
## [1] ""
## [2] " Track record of diving into data to discover hidden patterns"
## [3] " Strong troubleshooting and problem-solving skills"
## [4] " Effective communication and strong collaboration skillsInformation Security"
## [5] " Understanding of enterprise risk management methods and techniques to drive successful outcomes in a multi-national environment"
## [6] " Understanding architectural implications of meeting industry standards such as PCI DSS, ISO 27001, HIPAA, and NIST/DoD frameworks.Cloud Services"
## [7] " Experience with AWS Services"
## [8] " Working knowledge of cloud computing technologies and workload transition challenges"
## [9] " Familiarity with distributed computational approaches"
## [10] " Experience with scalable, distributed computing frameworks"
## [11] " Familiarity with archive, backup/recovery and business continuity processes in distributed operationsAmazon.com is an Equal Opportunity-Affirmative Action Employer <U+0096> Minority / Female / Disability / Veteran / Gender Identity / Sexual Orientationaws-proserv-na"
##
##
## [[1]][[24]]
## [1] "Minimum 5 years of Data Science experience"
##
## [[1]][[25]]
## [1] "At least 1 year of leadership experience required "
##
## [[1]][[26]]
## [1] "Machine Learning and Cyber Security experience"
##
## [[1]][[27]]
## [1] "Experience with ETL Pipelines"
##
## [[1]][[28]]
## [1] "NLP experience"
##
## [[1]][[29]]
## [1] "Experience or familiarity with Python, AWS, Scikit, Postgres, D3 and/or Scala"
##
## [[1]][[30]]
## [1] "Strong Written and Verbal communication a Must"
##
## [[1]][[31]]
## [1] "7+ years of overall IT engineering or architecture experience with a proven background in Cyber Security specific to:"
##
## [[1]][[32]]
## [1] "Data Protection - Data Loss Prevention (DLP), Encryption, Cryptography, Tokenization, Access Control, Data Classification, PKI or the supporting of these security solutions."
##
## [[1]][[33]]
## [1] "Extensive experience in a Red Hat Environment"
##
## [[1]][[34]]
## [1] "Extensive experience with networking protocols and concepts "
##
## [[1]][[35]]
## [1] "Experience with scripting languages such as Java, Shell, Python, or PowerShell"
##
## [[1]][[36]]
## [1] "Experience with large scale networks including Microsoft Exchange and Active Directory"
##
## [[1]][[37]]
## [1] "Ability to support and liaise with business process owners to incorporate data protection products and provisions into their processes."
##
## [[1]][[38]]
## [1] "Must be able to work collaboratively with other areas to advocate information security solutions."
##
## [[1]][[39]]
## [1] "Must possess a high degree of initiative, motivation, and problem-solving skills."
##
## [[1]][[40]]
## [1] "Ability to communicate security, data protection, data loss prevention related concepts to a broad range of technical and non-technical staff, including senior business leaders"
##
## [[1]][[41]]
## [1] "Data Loss Prevention concepts and products (such as Symantec DLP, Digital Guardian, RSA or Mcafee DLP, etc<U+0085>)"
##
## [[1]][[42]]
## [1] "Data encryption concepts and products (such as Vormetric, Protegrity, Voltage, etc<U+0085>)"
##
## [[1]][[43]]
## [1] "Data classification concepts and products (such as Titus, Varonis, etc<U+0085>)"
##
## [[1]][[44]]
## [1] "Tokenization, data masking, data dispersion techniques"
Clean_data <- read.csv(url("https://raw.githubusercontent.com/mikegankhuyag/607-Projects/master/Book2.csv"))
head(Clean_data)
## Industry Skill.Type Skill
## 1 Cyber Secuirty Programming/Technical Python
## 2 Cyber Secuirty Programming/Technical R
## 3 Cyber Secuirty Programming/Technical SQL
## 4 Cyber Secuirty Programming/Technical SPARKML
## 5 Cyber Secuirty Programming/Technical sckit
## 6 Cyber Secuirty Programming/Technical caret
Technical_Skills <- Clean_data[Clean_data$Skill.Type == "Programming/Technical",]
head(Technical_Skills)
## Industry Skill.Type Skill
## 1 Cyber Secuirty Programming/Technical Python
## 2 Cyber Secuirty Programming/Technical R
## 3 Cyber Secuirty Programming/Technical SQL
## 4 Cyber Secuirty Programming/Technical SPARKML
## 5 Cyber Secuirty Programming/Technical sckit
## 6 Cyber Secuirty Programming/Technical caret
Technical_Skills2 <- sort(table(Technical_Skills$Skill),decreasing = TRUE)
Technical_Skills3 <- data.frame(Technical_Skills2[1:10])
library(ggplot2)
## Warning: package 'ggplot2' was built under R version 3.4.2
ggplot(Technical_Skills3, aes(x = Technical_Skills3$Var1, y = Technical_Skills3$Freq, fill = Technical_Skills3$Freq)) +
geom_bar(stat="identity", color="black ")+
theme_minimal()+
ggtitle("Top Technical Data Science Skills in Cyber Security")+
xlab("Skills") +
ylab("Frequency") +
theme(axis.text.x = element_text(angle = 70, hjust = 1),legend.position = "none", panel.background = element_rect(fill="gray", colour = "lightblue"))
Overall <- sort(table(Clean_data$Skill),decreasing = TRUE)
Overall_top10 <- data.frame(Overall[1:10])
Overall_top10
## Var1 Freq
## 1 Python 4
## 2 Software Development 3
## 3 SQL 3
## 4 Developing models 2
## 5 ETL Techniques 2
## 6 Good communication 2
## 7 Meeting deadlines 2
## 8 Network Protocals 2
## 9 Problem solving 2
## 10 R 2
ggplot(Overall_top10, aes(x = Overall_top10$Var1, y = Overall_top10$Freq, fill = Overall_top10$Freq)) +
geom_bar(stat="identity", color="black ")+
theme_minimal()+
ggtitle("Top 10 Data Science Skills in Cyber Security")+
xlab("Skills") +
ylab("Frequency") +
theme(axis.text.x = element_text(angle = 70, hjust = 1),legend.position = "none", panel.background = element_rect(fill="gray", colour = "lightblue"))