# One-off maintenance and reporting tasks. Every task depends on :environment,
# so the application's models are loaded before the task body runs.
namespace :one_off do
  desc "copy DESE school ids from the master school list onto matching schools"
  task add_dese_ids: :environment do
    all_schools = School.all.includes(:district)
    updated_schools = []
    qualtrics_schools = {}

    # Index CSV rows by [district code, school code]; the first row seen for a
    # pair wins and later duplicates are reported and skipped.
    csv_file = Rails.root.join("data", "master_list_of_schools_and_districts.csv")
    CSV.parse(File.read(csv_file), headers: true) do |row|
      key = [row["District Code"].to_i, row["School Code"].to_i]
      if qualtrics_schools.key?(key)
        puts "Duplicate entry row #{row}"
        next
      end
      qualtrics_schools[key] = row
    end

    qualtrics_schools.each do |(district_id, school_id), csv_row|
      school = all_schools.find do |candidate|
        candidate.qualtrics_code == school_id && candidate.district.qualtrics_code == district_id
      end

      if school.nil?
        # No match on the code pair: report it and suggest schools whose name
        # contains the CSV school name so the mismatch can be fixed by hand.
        school_name = csv_row["School Name"].strip
        puts "Could not find school '#{school_name}' with district id: #{district_id}, school id: #{school_id}"
        potential_school_ids = School.where("name like ?", "%#{school_name}%").pluck(:id)
        puts "Potential ID matches: #{potential_school_ids}" if potential_school_ids.present?
        next
      end

      school.update!(dese_id: csv_row["DESE School ID"])
      updated_schools << school.id
    end

    # Report every school that was not touched by the CSV.
    School.where.not(id: updated_schools).each do |school|
      puts "School with unchanged DESE id: #{school.name}, id: #{school.id}"
    end
  end

  desc "list scales that have no survey responses"
  task list_scales_that_lack_survey_responses: :environment do
    # One array per academic year, each holding [range, scale_id, 0] for every
    # scale without responses. Scales whose id starts with "a-" are excluded
    # before counting so no query is spent on them.
    output = AcademicYear.all.map do |academic_year|
      Scale.all.filter_map do |scale|
        next if scale.scale_id.start_with?("a-")

        response_count = scale.survey_item_responses.where(academic_year:).count
        next if response_count.positive?

        [academic_year.range, scale.scale_id, response_count]
      end
    end
    pp output
  end

  desc "list survey_items that have no survey responses by district"
  task list_survey_items_that_lack_responses: :environment do
    # Nested arrays: year -> district -> [range, survey_item_id, 0, district name]
    # for every survey item without responses in that district and year.
    # Items whose id starts with "a-" are excluded before counting.
    output = AcademicYear.all.map do |academic_year|
      District.all.map do |district|
        SurveyItem.all.filter_map do |survey_item|
          next if survey_item.survey_item_id.start_with?("a-")

          response_count = survey_item.survey_item_responses
                                      .joins(:school)
                                      .where("school.district": district, academic_year:)
                                      .count
          next if response_count.positive?

          [academic_year.range, survey_item.survey_item_id, response_count, district.name]
        end
      end
    end
    pp output
  end

  desc "list the most recent admin data values"
  task list_recent_admin_data_values: :environment do
    range = 4.weeks.ago..1.second.ago
    # NOTE(review): relies on the keys of the grouped count being admin data
    # item records (they are sent #admin_data_item_id and #scale) - confirm.
    grouped_counts = AdminDataValue.where(updated_at: range).group(:admin_data_item).count
    values = grouped_counts.each_key.map do |admin_data_item|
      [admin_data_item.admin_data_item_id, admin_data_item.scale.measure.measure_id]
    end
    puts values
  end

  desc "delete 2022-23 survey responses"
  task delete_survey_responses_2022_23: :environment do
    response_count = SurveyItemResponse.count
    # NOTE(review): if no "2022-23" academic year exists the lookup yields nil
    # and the filter becomes `academic_year: nil` - confirm that is acceptable.
    SurveyItemResponse.where(academic_year: AcademicYear.find_by_range("2022-23")).delete_all
    puts "=====================> Deleted #{response_count - SurveyItemResponse.count} survey responses"
    # should be somewhere near 295738
  end

  desc "load survey responses"
  task load_survey_responses: :environment do
    survey_item_response_count = SurveyItemResponse.count
    path = "/data/survey_responses/clean/"

    # Feed every file yielded for the directory to a fresh loader.
    Sftp::Directory.open(path:) do |file|
      SurveyResponsesDataLoader.new.from_file(file:)
    end

    total_responses = SurveyItemResponse.count
    puts "=====================> Completed loading #{total_responses - survey_item_response_count} survey responses. #{total_responses} total responses in the database"
    Rails.cache.clear
  end

  desc "delete 2023-24 data"
  task delete_2023_24_data: :environment do
    academic_year = AcademicYear.find_by_range "2023-24"
    SurveyItemResponse.where(academic_year:).delete_all
    Respondent.where(academic_year:).delete_all
    # Re-run the application's seeds after the deletion.
    Rails.application.load_seed
  end

  desc "delete last year of respondent data and reseed numbers"
  task reseed_respondents: :environment do
    # NOTE(review): this removes every Respondent row, not only one year.
    Respondent.delete_all
    seeder = Seeder.new

    # All enrollment files are seeded first, then all staffing files.
    %w[enrollment.csv nj_enrollment.csv wi_enrollment.csv].each do |file_name|
      seeder.seed_enrollment Rails.root.join("data", "enrollment", file_name)
    end
    %w[staffing.csv nj_staffing.csv wi_staffing.csv].each do |file_name|
      seeder.seed_staffing Rails.root.join("data", "staffing", file_name)
    end
  end

  desc "delete 2022-24 AcademicYear and all responses, admin data, enrollment numbers and staffing numbers"
  task delete_2022_24: :environment do
    ranges = ["2022-23", "2023-24", "2024-25", "2022-23 Fall", "2022-23 Spring", "2023-24 Fall", "2023-24 Spring"]
    AcademicYear.where(range: ranges).each do |academic_year|
      # Remove dependent rows first, then the academic year itself.
      AdminDataValue.where(academic_year:).delete_all
      Respondent.where(academic_year:).delete_all
      SurveyItemResponse.where(academic_year:).delete_all
      academic_year.delete
    end
  end

  desc "print out percentage of nil values for range"
  task nil_grades: :environment do
    # Loop-invariant, so it is looked up once instead of twice per school/year.
    student_survey_items = SurveyItem.student_survey_items

    AcademicYear.all.each do |academic_year|
      School.all.each do |school|
        responses = SurveyItemResponse.where(school:, academic_year:, survey_item: student_survey_items)
        total = responses.count
        # Without responses there is no meaningful percentage (0 / 0.0).
        next if total.zero?

        nil_count = responses.where(grade: nil).count
        percentage = (nil_count.to_f / total * 100).round(1)
        # Only schools with more than 1% of responses missing a grade are listed.
        puts "#{percentage}% nil grades for: #{school.name}, #{academic_year.range}" if percentage > 1
      end
    end
  end
end