parent
725348bf95
commit
1810ee0074
@ -1,38 +1,40 @@
|
|||||||
require 'watir'
|
require "watir"
|
||||||
require 'csv'
|
require "csv"
|
||||||
|
|
||||||
module Dese
|
module Dashboard
|
||||||
module Enrollments
|
module Dese
|
||||||
include Dese::Scraper
|
module Enrollments
|
||||||
attr_reader :filepaths
|
include Dashboard::Dese::Scraper
|
||||||
|
attr_reader :filepaths
|
||||||
|
|
||||||
# Writes the enrollment CSV header row to +filepath+ and then, for every
# academic year yielded by +run+, builds the Prerequisites for the DESE
# "enrollment by grade" school report of that year.
#
# The calculation lambda always yields "NA" and the admin data item id is
# left blank for this report.
# NOTE(review): presumably +run+ (from the Scraper mixin) consumes the
# Prerequisites returned by the block to do the actual scraping — confirm.
#
# @param filepath [String, Pathname] destination CSV, passed on to
#   +write_headers+ and +Prerequisites+
# @return whatever +run+ returns
def scrape_enrollments(filepath:)
  grade_columns = %w[PK K] + (1..12).map(&:to_s) + %w[SP Total]
  headers = [
    "Raw likert calculation",
    "Likert Score",
    "Admin Data Item",
    "Academic Year",
    "School Name",
    "DESE ID"
  ] + grade_columns
  write_headers(filepath:, headers:)

  run do |academic_year|
    report_url = "https://profiles.doe.mass.edu/statereport/enrollmentbygrade.aspx"
    # Dropdown element id => option to select before submitting the form.
    dropdowns = {
      "ctl00_ContentPlaceHolder1_ddReportType" => "School",
      "ctl00_ContentPlaceHolder1_ddYear" => academic_year.range
    }
    not_applicable = ->(_headers, _items) { "NA" }

    Prerequisites.new(filepath, report_url, dropdowns, "btnViewReport", "", not_applicable)
  end
end
|
|
||||||
|
|
||||||
# Looks up the total enrollment recorded for one school in one academic year.
#
# On the first call the CSV at +filepath+ is read and every row is cached in
# @students, keyed by [DESE ID as Integer, "Academic Year" string]. Later
# calls are answered from that cache and do not re-read the file, even when a
# different +filepath+ is passed.
#
# @param filepath [String, Pathname] CSV with "Academic Year", "DESE ID" and
#   "Total" columns
# @param dese_id [Integer] school id; the CSV's "DESE ID" is converted with
#   +to_i+ before being used as a key
# @param year [String] academic year exactly as written in the
#   "Academic Year" column
# @return [Integer, nil] the "Total" value with thousands separators removed,
#   or nil when no row matches or the matching row has a blank "Total"
def student_count(filepath:, dese_id:, year:)
  @students ||= {}
  if @students.empty?
    # Stream the file row by row instead of loading it whole.
    CSV.foreach(filepath, headers: true) do |row|
      total = row["Total"]
      # A blank cell parses as nil; treat it as "no data" rather than crashing.
      next if total.nil?

      school_id = row["DESE ID"].to_i
      @students[[school_id, row["Academic Year"]]] = total.delete(",").to_i
    end
  end

  @students[[dese_id, year]]
end
|
end
|
||||||
end
|
end
|
||||||
end
|
end
|
||||||
|
|||||||
File diff suppressed because it is too large
Load Diff
File diff suppressed because it is too large
Load Diff
@ -0,0 +1,24 @@
|
|||||||
|
# Rake tasks that run the DESE scrapers.
#
# NOTE(review): the admin and enrollment tasks reference scrapers as Dese::*,
# while the staffing task uses Dashboard::Dese::*. A rake namespace does not
# open a Ruby module, so Dese::* resolves from the top level — confirm those
# classes were not moved under Dashboard::Dese.
namespace :dashboard do
  namespace :scrape do
    desc "scrape dese site for admin data"
    task admin: :environment do
      puts "scraping data from dese"
      scrapers = [Dese::OneAOne, Dese::OneAThree, Dese::TwoAOne, Dese::TwoCOne, Dese::ThreeAOne, Dese::ThreeATwo,
                  Dese::ThreeBOne, Dese::ThreeBTwo, Dese::FourAOne, Dese::FourBTwo, Dese::FourDOne, Dese::FiveCOne,
                  Dese::FiveDTwo]
      scrapers.each do |scraper|
        scraper.new.run_all
      end
    end

    # Description previously read "teacher staffing information" (copy-paste error).
    desc "scrape dese site for student enrollment information"
    task enrollment: :environment do
      filepath = Dashboard::Engine.root.join("data", "dashboard", "enrollment", "enrollment.csv")
      Dese::ThreeATwo.new.scrape_enrollments(filepath:)
    end

    # Description previously read "student staffing information" (copy-paste error).
    desc "scrape dese site for teacher staffing information"
    task staffing: :environment do
      Dashboard::Dese::Staffing.new.run_all
    end
  end
end
|
||||||
Loading…
Reference in new issue