namespace :one_off do task add_dese_ids: :environment do all_schools = School.all.includes(:district) updated_schools = [] qualtrics_schools = {} csv_file = Rails.root.join('data', 'master_list_of_schools_and_districts.csv') CSV.parse(File.read(csv_file), headers: true) do |row| district_id = row['District Code'].to_i school_id = row['School Code'].to_i if qualtrics_schools[[district_id, school_id]].present? puts "Duplicate entry row #{row}" next end qualtrics_schools[[district_id, school_id]] = row end qualtrics_schools.each do |(district_id, school_id), csv_row| school = all_schools.find do |school| school.qualtrics_code == school_id && school.district.qualtrics_code == district_id end if school.nil? school_name = csv_row['School Name'].strip puts "Could not find school '#{school_name}' with district id: #{district_id}, school id: #{school_id}" potential_school_ids = School.where('name like ?', "%#{school_name}%").map(&:id) puts "Potential ID matches: #{potential_school_ids}" if potential_school_ids.present? next end school.update!(dese_id: csv_row['DESE School ID']) updated_schools << school.id end School.where.not(id: updated_schools).each do |school| puts "School with unchanged DESE id: #{school.name}, id: #{school.id}" end end desc 'list scales that have no survey responses' task list_scales_that_lack_survey_responses: :environment do output = AcademicYear.all.map do |academic_year| Scale.all.map do |scale| [academic_year.range, scale.scale_id, scale.survey_item_responses.where(academic_year:).count] end end output = output.map { |year| year.reject { |scale| scale[2] > 0 || scale[1].starts_with?('a-') } } pp output end desc 'list survey_items that have no survey responses by district' task list_survey_items_that_lack_responses: :environment do output = AcademicYear.all.map do |academic_year| District.all.map do |district| SurveyItem.all.map do |survey_item| [academic_year.range, survey_item.survey_item_id, survey_item.survey_item_responses.joins(:school).where("school.district": district, academic_year:).count, district.name] end end end output = output.map do |year| year.map do |district| district.reject do |survey_item| survey_item[2] > 0 || survey_item[1].starts_with?('a-') end end end pp output end desc 'list the most recent admin data values' task list_recent_admin_data_values: :environment do range = 4.weeks.ago..1.second.ago values = AdminDataValue.where(updated_at: range).group(:admin_data_item).count.map do |item| [item[0].admin_data_item_id, item[0].scale.measure.measure_id] end puts values end desc 'load survey responses for lowell schools' task load_survey_responses_for_lowell: :environment do survey_item_response_count = SurveyItemResponse.count student_count = Student.count Sftp::Directory.open(path: '/test/survey_responses/') do |file| SurveyResponsesDataLoader.from_file(file:) end puts "=====================> Completed loading #{SurveyItemResponse.count - survey_item_response_count} survey responses. #{SurveyItemResponse.count} total responses in the database" Sftp::Directory.open(path: '/test/survey_responses/') do |file| StudentLoader.from_file(file:, rules: [Rule::SkipNonLowellSchools]) end puts "=====================> Completed loading #{Student.count - student_count} students. #{Student.count} total students" puts 'Resetting race scores' RaceScoreLoader.reset(fast_processing: false) puts "=====================> Completed loading #{RaceScore.count} race scores" Rails.cache.clear end desc 'delete 2022-23 survey responses' task delete_survey_responses_2022_23: :environment do response_count = SurveyItemResponse.all.count SurveyItemResponse.where(academic_year: AcademicYear.find_by_range('2022-23')).delete_all puts "=====================> Deleted #{response_count - SurveyItemResponse.all.count} survey responses" # should be somewhere near 295738 end desc 'delete 2023-24 survey responses' task delete_survey_responses_2023_24: :environment do response_count = SurveyItemResponse.all.count SurveyItemResponse.where(academic_year: AcademicYear.find_by_range('2023-24')).delete_all puts "=====================> Deleted #{response_count - SurveyItemResponse.all.count} survey responses" end desc 'load survey responses for lowell schools 2022-23' task load_survey_responses_for_lowell_2022_23: :environment do survey_item_response_count = SurveyItemResponse.count student_count = Student.count path = '/data/survey_responses/2022-23/' Sftp::Directory.open(path:) do |file| SurveyResponsesDataLoader.from_file(file:) end puts "=====================> Completed loading #{SurveyItemResponse.count - survey_item_response_count} survey responses. #{SurveyItemResponse.count} total responses in the database" Sftp::Directory.open(path:) do |file| StudentLoader.from_file(file:, rules: [Rule::SkipNonLowellSchools]) end puts "=====================> Completed loading #{Student.count - student_count} students. #{Student.count} total students" puts 'Resetting race scores' RaceScoreLoader.reset(fast_processing: false, academic_years: [AcademicYear.find_by_range('2022-23')]) puts "=====================> Completed loading #{RaceScore.count} race scores" Rails.cache.clear end desc 'delete errant response' task delete_responses: :environment do SurveyItemResponse.where(response_id: 'R_diYAw7qOj4W1UZ3').delete_all SurveyItemResponse.where(response_id: 'R_27fKhVfyeKGMF5q').delete_all SurveyItemResponse.where(response_id: 'R_2cjPX1Ngxr2Hc4c').delete_all end desc 'upload spring survey results to 23-24' task upload_spring23: :environment do new_files = Array.new input_filepath = Rails.root.join('tmp', 'data', 'rpp_data', 'clean') Dir.foreach(input_filepath) do |filename| next if filename.start_with?('.') # skip hidden files and ./.. directories # this can probably be replaced with Dir.join or similar input_filename = Rails.root.join('tmp', 'data', 'rpp_data', 'clean', filename).to_s sftptogo_url = ENV['SFTPTOGO_URL'] uri = URI.parse(sftptogo_url) Net::SFTP.start(uri.host, uri.user, password: uri.password) do |sftp| puts "Uploading #{filename}..." sftp.upload!(input_filename, "/data/survey_responses/2023-24/#{filename}") end new_files.append(filename) end # print remote directory contents with new files marked path = '/data/survey_responses/2023-24/' Sftp::Directory.open(path:) do |file| # the open method already prints all the contents... end end desc 'load spring survey responses' task load_spring_survey_responses: :environment do survey_item_response_count = SurveyItemResponse.count student_count = Student.count path = '/data/survey_responses/2023-24/' Sftp::Directory.open(path:) do |file| SurveyResponsesDataLoader.from_file(file:) end puts "=====================> Completed loading #{SurveyItemResponse.count - survey_item_response_count} survey responses" Sftp::Directory.open(path:) do |file| StudentLoader.from_file(file:, rules: [Rule::SkipNonLowellSchools]) end puts "=====================> Completed loading #{Student.count - student_count} students. #{Student.count} total students" puts 'Resetting race scores' RaceScoreLoader.reset(fast_processing: false) puts "=====================> Completed loading #{RaceScore.count} race scores" Rails.cache.clear end end