Faster admin data loader + rename School.school_hash

This commit is contained in:
Gabe Farrell 2024-04-22 14:46:37 -04:00
parent 40aef35c2c
commit 6fac759ec2
7 changed files with 126 additions and 81 deletions

View file

@ -1,80 +1,100 @@
require "csv"
namespace :data do
# Rake task data:load_survey_responses — loads survey responses from the fixed SFTP
# directory "/data/survey_responses/clean/" and then clears the Rails cache.
# NOTE(review): this text is a rendered diff, so what appear to be the pre-change lines
# (paren-less calls) and the post-change lines (parenthesized calls) are both present;
# only one of each pair exists in the real rake file.
desc "load survey responses"
task load_survey_responses: :environment do
namespace(:data) do
desc("load survey responses")
task(load_survey_responses: :environment) do
# Row count before loading, so the summary below can report how many rows this run added.
survey_item_response_count = SurveyItemResponse.count
# NOTE(review): student_count is assigned but never read in the visible lines.
student_count = Student.count
path = "/data/survey_responses/clean/"
# Whatever Sftp::Directory.open yields (named `file` here) is passed to a fresh
# SurveyResponsesDataLoader on every iteration.
Sftp::Directory.open(path:) do |file|
SurveyResponsesDataLoader.new.from_file(file:)
end
# The first puts prints only the table total; the parenthesized puts prints the
# difference from the starting count followed by the table total.
puts "=====================> Completed loading #{SurveyItemResponse.count} survey responses"
puts(
"=====================> Completed loading #{SurveyItemResponse.count - survey_item_response_count} survey responses. #{SurveyItemResponse.count} total responses in the database"
)
Rails.cache.clear
end
# Rake task load_survey_responses_from_path — same flow as the fixed-path loader, but the
# SFTP directory comes from the SFTP_PATH environment variable.
# NOTE(review): this text is a rendered diff; lines that differ only in quoting or
# parentheses appear to be the before/after versions of one statement.
desc "load survey responses from a specific directory"
task load_survey_responses_from_path: :environment do
desc("load survey responses from a specific directory")
task(load_survey_responses_from_path: :environment) do
# Row count before loading, used to report the number of rows added by this run.
survey_item_response_count = SurveyItemResponse.count
# NOTE(review): student_count is assigned but never read in the visible lines.
student_count = Student.count
# String interpolation turns a missing SFTP_PATH (nil) into "" rather than raising.
# NOTE(review): how Sftp::Directory.open treats an empty path is not visible here — confirm.
path = "#{ENV['SFTP_PATH']}"
path = "#{ENV["SFTP_PATH"]}"
Sftp::Directory.open(path:) do |file|
SurveyResponsesDataLoader.new.from_file(file:)
end
# Prints rows added (current count minus starting count) and the table total.
puts "=====================> Completed loading #{SurveyItemResponse.count - survey_item_response_count} survey responses. #{SurveyItemResponse.count} total responses in the database"
puts(
"=====================> Completed loading #{SurveyItemResponse.count - survey_item_response_count} survey responses. #{SurveyItemResponse.count} total responses in the database"
)
Rails.cache.clear
end
# Rake task reset_response_rates — calls ResponseRateLoader.reset, clears the Rails cache,
# and prints the resulting ResponseRate row count.
# NOTE(review): this text is a rendered diff; the paren-less and parenthesized lines
# appear to be the before/after versions of the same statements.
desc "reset response rate values"
task reset_response_rates: :environment do
puts "Resetting response rates"
desc("reset response rate values")
task(reset_response_rates: :environment) do
puts("Resetting response rates")
ResponseRateLoader.reset
Rails.cache.clear
# NOTE(review): the message says "survey responses" but the number printed is
# ResponseRate.count — wording looks copied from the survey-response tasks; confirm intent.
puts "=====================> Completed loading #{ResponseRate.count} survey responses"
puts("=====================> Completed loading #{ResponseRate.count} survey responses")
end
# Rake task reset_race_scores — calls RaceScoreLoader.reset, clears the Rails cache,
# and prints the resulting RaceScore row count.
# NOTE(review): this text is a rendered diff; the paren-less and parenthesized lines
# appear to be the before/after versions of the same statements.
desc "reset race score calculations"
task reset_race_scores: :environment do
puts "Resetting race scores"
desc("reset race score calculations")
task(reset_race_scores: :environment) do
puts("Resetting race scores")
# NOTE(review): the effect of fast_processing: false is defined in RaceScoreLoader,
# which is not visible here — confirm before changing it.
RaceScoreLoader.reset(fast_processing: false)
Rails.cache.clear
# NOTE(review): the message says "survey responses" but the number printed is
# RaceScore.count — wording looks copied from the survey-response tasks; confirm intent.
puts "=====================> Completed loading #{RaceScore.count} survey responses"
puts("=====================> Completed loading #{RaceScore.count} survey responses")
end
# Rake task load_admin_data — feeds every CSV under data/admin_data/dese to
# Dese::Loader.load_data and reports how many AdminDataValue rows were added.
# NOTE(review): this text is a rendered diff. The bare `while` loop with a trailing
# task-level `rescue ThreadError` appears to be the earlier single-threaded version; the
# `workers = pool_size.times.map` section appears to be its threaded replacement.
desc "load admin_data"
task load_admin_data: :environment do
desc("load admin_data")
task(load_admin_data: :environment) do
# Row count before loading, used for the "added" figure in the final message.
original_count = AdminDataValue.count
# Number of worker threads started below.
pool_size = 2
# All CSV paths are queued up front; nothing is pushed after the workers start.
jobs = Queue.new
Dir.glob(Rails.root.join("data", "admin_data", "dese", "*.csv")).each { |filepath| jobs << filepath }
# pop(true) is the non-blocking form: it raises ThreadError once the queue is empty,
# which is what ends the loop.
while filepath = jobs.pop(true)
puts "=====================> Loading data from csv at path: #{filepath}"
Dese::Loader.load_data filepath:
# Each worker drains the shared queue until the non-blocking pop raises ThreadError.
# NOTE(review): assumes Dese::Loader.load_data is safe to run concurrently and that the
# database connection pool allows at least pool_size connections — TODO confirm.
workers = pool_size.times.map do
Thread.new do
while filepath = jobs.pop(true)
puts("=====================> Loading data from csv at path: #{filepath}")
Dese::Loader.load_data(filepath:)
end
# An empty queue is the normal exit path for a worker, so the error is swallowed.
rescue ThreadError
end
end
rescue ThreadError
puts "=====================> Completed loading #{AdminDataValue.count - original_count} admin data values"
# Wait for every worker to finish so the count below includes all loaded files.
workers.each(&:join)
puts("=====================> Completed loading #{AdminDataValue.count - original_count} admin data values")
end
desc "reset all cache counters"
task reset_cache_counters: :environment do
puts "=====================> Resetting Category counters"
desc("reset all cache counters")
task(reset_cache_counters: :environment) do
puts("=====================> Resetting Category counters")
Category.all.each do |category|
Category.reset_counters(category.id, :subcategories)
end
puts "=====================> Resetting Subcategory counters"
puts("=====================> Resetting Subcategory counters")
Subcategory.all.each do |subcategory|
Subcategory.reset_counters(subcategory.id, :measures)
end
puts "=====================> Resetting Measure counters"
puts("=====================> Resetting Measure counters")
Measure.all.each do |measure|
Measure.reset_counters(measure.id, :scales)
end
puts "=====================> Resetting Scale counters"
puts("=====================> Resetting Scale counters")
Scale.all.each do |scale|
Scale.reset_counters(scale.id, :survey_items)
end
puts "=====================> Resetting SurveyItem counters"
puts("=====================> Resetting SurveyItem counters")
SurveyItem.all.each do |survey_item|
SurveyItem.reset_counters(survey_item.id, :survey_item_responses)
end