You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
134 lines
5.5 KiB
134 lines
5.5 KiB
require 'watir'
|
|
require 'csv'
|
|
|
|
module Dese
|
|
class ThreeBTwo
|
|
include Dese::Scraper
|
|
include Dese::Enrollments
|
|
attr_reader :filepaths
|
|
|
|
def initialize(filepaths: [Rails.root.join('data', 'admin_data', 'dese', '3B_2_enrollments.csv'),
|
|
Rails.root.join('data', 'admin_data', 'dese', '3B_2_teacher_by_race_and_gender.csv'),
|
|
Rails.root.join('data', 'admin_data', 'dese', '3B_2_student_by_race_and_gender.csv')])
|
|
@filepaths = filepaths
|
|
end
|
|
|
|
def run_all
|
|
# filepath = filepaths[0]
|
|
# scrape_enrollments(filepath:)
|
|
|
|
filepath = filepaths[1]
|
|
headers = ['Raw likert calculation', 'Likert Score', 'Admin Data Item', 'Academic Year', 'Teachers of color (%)', 'School Name', 'DESE ID',
|
|
'African American (%)', 'Asian (%)', 'Hispanic (%)', 'White (%)', 'Native American (%)',
|
|
'Native Hawaiian Pacific Islander (%)', 'Multi-Race Non-Hispanic (%)', 'Females (%)',
|
|
'Males (%)', 'FTE Count']
|
|
write_headers(filepath:, headers:)
|
|
run_teacher_demographics(filepath:)
|
|
|
|
filepath = filepaths[2]
|
|
headers = ['Raw likert calculation', 'Likert Score', 'Admin Data Item', 'Academic Year', 'Non-White Teachers %', 'Non-White Students %', 'School Name', 'DESE ID',
|
|
'African American', 'Asian', 'Hispanic', 'White', 'Native American',
|
|
'Native Hawaiian or Pacific Islander', 'Multi-Race or Non-Hispanic', 'Males',
|
|
'Females', 'Non-Binary', 'Students of color (%)']
|
|
write_headers(filepath:, headers:)
|
|
run_student_demographics(filepath:)
|
|
|
|
browser.close
|
|
end
|
|
|
|
def run_teacher_demographics(filepath:)
|
|
run do |academic_year|
|
|
admin_data_item_id = ''
|
|
url = 'https://profiles.doe.mass.edu/statereport/teacherbyracegender.aspx'
|
|
range = academic_year.range
|
|
selectors = { 'ctl00_ContentPlaceHolder1_ddReportType' => 'School',
|
|
'ctl00_ContentPlaceHolder1_ddYear' => range,
|
|
'ctl00_ContentPlaceHolder1_ddDisplay' => 'Percentages',
|
|
'ctl00_ContentPlaceHolder1_ddClassification' => 'Teacher' }
|
|
submit_id = 'ctl00_ContentPlaceHolder1_btnViewReport'
|
|
calculation = lambda { |headers, items|
|
|
african_american_index = headers['African American (%)']
|
|
african_american_number = items[african_american_index].to_f
|
|
|
|
asian_index = headers['Asian (%)']
|
|
asian_number = items[asian_index].to_f
|
|
|
|
hispanic_index = headers['Hispanic (%)']
|
|
hispanic_number = items[hispanic_index].to_f
|
|
|
|
native_american_index = headers['Native American (%)']
|
|
native_american_number = items[native_american_index].to_f
|
|
|
|
native_hawaiian_index = headers['Native Hawaiian, Pacific Islander (%)']
|
|
native_hawaiian_number = items[native_hawaiian_index].to_f
|
|
|
|
multi_race_index = headers['Multi-Race,Non-Hispanic (%)']
|
|
multi_race_number = items[multi_race_index].to_f
|
|
|
|
non_white_teachers = african_american_number + asian_number + hispanic_number + native_american_number + native_hawaiian_number + multi_race_number
|
|
items.unshift(non_white_teachers)
|
|
|
|
non_white_teachers
|
|
}
|
|
Prerequisites.new(filepath, url, selectors, submit_id, admin_data_item_id, calculation)
|
|
end
|
|
end
|
|
|
|
def teacher_count(filepath:, dese_id:, year:)
|
|
@teachers ||= {}
|
|
@years_with_data ||= Set.new
|
|
if @teachers.count == 0
|
|
CSV.parse(File.read(filepath), headers: true).map do |row|
|
|
academic_year = row['Academic Year']
|
|
@years_with_data << academic_year
|
|
school_id = row['DESE ID'].to_i
|
|
total = row['Teachers of color (%)'].gsub(',', '')
|
|
total = 'NA' if total == '' || total.nil?
|
|
@teachers[[school_id, academic_year]] = total
|
|
end
|
|
end
|
|
return 'NA' unless @years_with_data.include? year
|
|
|
|
@teachers[[dese_id, year]]
|
|
end
|
|
|
|
def run_student_demographics(filepath:)
|
|
run do |academic_year|
|
|
admin_data_item_id = 'a-cure-i1'
|
|
url = 'https://profiles.doe.mass.edu/statereport/enrollmentbyracegender.aspx'
|
|
range = academic_year.range
|
|
|
|
selectors = { 'ctl00_ContentPlaceHolder1_ddReportType' => 'School',
|
|
'ctl00_ContentPlaceHolder1_ddYear' => range }
|
|
submit_id = 'btnViewReport'
|
|
calculation = lambda { |headers, items|
|
|
white_index = headers['White']
|
|
white_number = items[white_index].to_f
|
|
dese_id = items[headers['School Code']].to_i
|
|
non_white_student_percentage = (100 - white_number).to_f
|
|
items.unshift(non_white_student_percentage)
|
|
count_of_teachers = teacher_count(filepath: filepaths[1], dese_id:, year: academic_year.range)
|
|
return 'NA' if count_of_teachers == 'NA'
|
|
|
|
non_white_teacher_percentage = count_of_teachers.to_f
|
|
items.unshift(non_white_teacher_percentage)
|
|
|
|
floor = 5
|
|
benchmark = 0.25
|
|
|
|
return 1 if non_white_student_percentage.zero? && non_white_teacher_percentage < floor
|
|
|
|
if non_white_teacher_percentage >= floor
|
|
parity_index = non_white_teacher_percentage / non_white_student_percentage
|
|
likert_score = parity_index * 4 / benchmark
|
|
else
|
|
likert_score = 1
|
|
end
|
|
likert_score
|
|
}
|
|
Prerequisites.new(filepath, url, selectors, submit_id, admin_data_item_id, calculation)
|
|
end
|
|
end
|
|
end
|
|
end
|