Commit 6d2cf16ad6630bf7145c0e7a2c9d6b78f0d66e67
1 parent
55041d0f
Exists in
master
and in
1 other branch
move bunch of items from test_api to prune_db
Showing
2 changed files
with
233 additions
and
219 deletions
Show diff stats
lib/tasks/prune_db.rake
@@ -17,6 +17,223 @@ namespace :prune_db do | @@ -17,6 +17,223 @@ namespace :prune_db do | ||
17 | end | 17 | end |
18 | end | 18 | end |
19 | 19 | ||
20 | + desc "Generate appearances for any votes that have no current appearance, should only need to be run once" | ||
21 | + task(:generate_appearances_for_existing_votes => :environment) do | ||
22 | + votes = Vote.all | ||
23 | + | ||
24 | + count = 0 | ||
25 | + votes.each do |v| | ||
26 | + if v.appearance.nil? | ||
27 | + print "." | ||
28 | + a = Appearance.create(:voter_id => v.voter_id, :site_id => v.site_id, :prompt_id => v.prompt_id, :question_id => v.question_id, :created_at => v.created_at, :updated_at => v.updated_at) | ||
29 | + v.appearance = a | ||
30 | + v.save | ||
31 | + | ||
32 | + count += 1 | ||
33 | + end | ||
34 | + end | ||
35 | + | ||
36 | + print count | ||
37 | + end | ||
38 | + | ||
39 | + desc "Don't run unless you know what you are doing" | ||
40 | + task(:generate_lots_of_votes => :environment) do | ||
41 | + if Rails.env.production? | ||
42 | + print "You probably don't want to run this in production as it will falsify a bunch of random votes" | ||
43 | + end | ||
44 | + | ||
45 | + | ||
46 | + current_user = User.first | ||
47 | + 1000.times do |n| | ||
48 | + puts "#{n} votes completed" if n % 100 == 0 | ||
49 | + question = Question.find(214) # test question change as needed | ||
50 | + @prompt = question.catchup_choose_prompt(1).first | ||
51 | + @appearance = current_user.record_appearance(current_user.default_visitor, @prompt) | ||
52 | + | ||
53 | + direction = (rand(2) == 0) ? "left" : "right" | ||
54 | + current_user.record_vote(:prompt => @prompt, :direction => direction, :appearance_lookup => @appearance.lookup) | ||
55 | + end | ||
56 | + | ||
57 | + end | ||
58 | + | ||
59 | + desc "Dump votes of a question by left vs right id" | ||
60 | + task(:make_csv => :environment) do | ||
61 | + | ||
62 | + q = Question.find(214) | ||
63 | + | ||
64 | + | ||
65 | + the_prompts = q.prompts_hash_by_choice_ids | ||
66 | + | ||
67 | + #hash_of_choice_ids_from_left_to_right_to_votes | ||
68 | + the_hash = {} | ||
69 | + q.choices.each do |l| | ||
70 | + q.choices.each do |r| | ||
71 | + next if l.id == r.id | ||
72 | + | ||
73 | + if not the_hash.has_key?(l.id) | ||
74 | + the_hash[l.id] = {} | ||
75 | + the_hash[l.id][l.id] = 0 | ||
76 | + end | ||
77 | + | ||
78 | + p = the_prompts["#{l.id}, #{r.id}"] | ||
79 | + if p.nil? | ||
80 | + the_hash[l.id][r.id] = 0 | ||
81 | + else | ||
82 | + the_hash[l.id][r.id] = p.appearances.size | ||
83 | + end | ||
84 | + end | ||
85 | + end | ||
86 | + | ||
87 | + the_hash.sort.each do |xval, row| | ||
88 | + rowarray = [] | ||
89 | + row.sort.each do |yval, cell| | ||
90 | + rowarray << cell | ||
91 | + end | ||
92 | + puts rowarray.join(", ") | ||
93 | + end | ||
94 | + end | ||
95 | + | ||
96 | + desc "Should only need to be run once" | ||
97 | + task(:generate_all_possible_prompts => :environment) do | ||
98 | + Question.find(:all).each do |q| | ||
99 | + choices = q.choices | ||
100 | + if q.prompts.size > choices.size**2 - choices.size | ||
101 | + print "ERROR: #{q.id}\n" | ||
102 | + next | ||
103 | + elsif q.prompts.size == choices.size**2 - choices.size | ||
104 | + print "#{q.id} has enough prompts, skipping...\n" | ||
105 | + next | ||
106 | + else | ||
107 | + print "#{q.id} should add #{(choices.size ** 2 - choices.size) - q.prompts.size}\n" | ||
108 | + | ||
109 | + end | ||
110 | + created_timestring = q.created_at.to_s(:db) | ||
111 | + updated_timestring = Time.now.to_s(:db) #isn't rails awesome? | ||
112 | + promptscount=0 | ||
113 | + inserts = [] | ||
114 | + the_prompts = Prompt.find(:all, :select => 'id, left_choice_id, right_choice_id', :conditions => {:question_id => q.id}) | ||
115 | + | ||
116 | + the_prompts_hash = {} | ||
117 | + the_prompts.each do |p| | ||
118 | + the_prompts_hash["#{p.left_choice_id},#{p.right_choice_id}"] = 1 | ||
119 | + end | ||
120 | + | ||
121 | + choices.each do |l| | ||
122 | + choices.each do |r| | ||
123 | + if l.id == r.id | ||
124 | + next | ||
125 | + else | ||
126 | + #p = the_prompts.find{|o| o.left_choice_id == l.id && o.right_choice_id == r.id} | ||
127 | + keystring = "#{l.id},#{r.id}" | ||
128 | + p = the_prompts_hash[keystring] | ||
129 | + if p.nil? | ||
130 | + inserts.push("(NULL, #{q.id}, NULL, #{l.id}, '#{created_timestring}', '#{updated_timestring}', NULL, 0, #{r.id}, NULL, NULL)") | ||
131 | + promptscount+=1 | ||
132 | + end | ||
133 | + | ||
134 | + end | ||
135 | + | ||
136 | + end | ||
137 | + end | ||
138 | + | ||
139 | + print "Added #{promptscount} to #{q.id}\n" | ||
140 | + sql = "INSERT INTO `prompts` (`algorithm_id`, `question_id`, `voter_id`, `left_choice_id`, `created_at`, `updated_at`, `tracking`, `votes_count`, `right_choice_id`, `active`, `randomkey`) VALUES #{inserts.join(', ')}" | ||
141 | + unless inserts.empty? | ||
142 | + ActiveRecord::Base.connection.execute(sql) | ||
143 | + end | ||
144 | + | ||
145 | + Question.update_counters(q.id, :prompts_count => promptscount) | ||
146 | + | ||
147 | + | ||
148 | + end | ||
149 | + | ||
150 | + | ||
151 | + | ||
152 | + end | ||
153 | + | ||
154 | + | ||
155 | + | ||
156 | + desc "Generate past density information" | ||
157 | + task(:generate_past_densities => :environment) do | ||
158 | + #this is not elegant, but should only be run once, so quick and dirty wins | ||
159 | + | ||
160 | + start_date = Vote.find(:all, :conditions => 'loser_choice_id IS NOT NULL', :order => :created_at, :limit => 1).first.created_at.to_date | ||
161 | + start_date.upto(Date.today) do |the_date| | ||
162 | + questions = Question.find(:all, :conditions => ['created_at < ?', the_date]) | ||
163 | + | ||
164 | + print the_date.to_s | ||
165 | + questions.each do |q| | ||
166 | + puts q.id | ||
167 | + relevant_choices = q.choices.find(:all, :conditions => ['created_at < ?', the_date]) | ||
168 | + | ||
169 | + seed_choices = 0 | ||
170 | + | ||
171 | + if relevant_choices == 0 | ||
172 | + next | ||
173 | + #this question had not been created yet | ||
174 | + end | ||
175 | + | ||
176 | + relevant_choices.each do |c| | ||
177 | + if !c.user_created | ||
178 | + seed_choices+=1 | ||
179 | + end | ||
180 | + | ||
181 | + end | ||
182 | + | ||
183 | + nonseed_choices = relevant_choices.size - seed_choices | ||
184 | + | ||
185 | + seed_seed_total = seed_choices **2 - seed_choices | ||
186 | + nonseed_nonseed_total = nonseed_choices **2 - nonseed_choices | ||
187 | + seed_nonseed_total = seed_choices * nonseed_choices | ||
188 | + nonseed_seed_total = seed_choices * nonseed_choices | ||
189 | + | ||
190 | + seed_seed_sum = 0 | ||
191 | + seed_nonseed_sum= 0 | ||
192 | + nonseed_seed_sum= 0 | ||
193 | + nonseed_nonseed_sum= 0 | ||
194 | + | ||
195 | + q.appearances.find_each(:conditions => ['prompt_id IS NOT NULL AND created_at < ?', the_date]) do |a| | ||
196 | + | ||
197 | + p = a.prompt | ||
198 | + if p.left_choice.user_created == false && p.right_choice.user_created == false | ||
199 | + seed_seed_sum += 1 | ||
200 | + elsif p.left_choice.user_created == false && p.right_choice.user_created == true | ||
201 | + seed_nonseed_sum += 1 | ||
202 | + elsif p.left_choice.user_created == true && p.right_choice.user_created == false | ||
203 | + nonseed_seed_sum += 1 | ||
204 | + elsif p.left_choice.user_created == true && p.right_choice.user_created == true | ||
205 | + nonseed_nonseed_sum += 1 | ||
206 | + end | ||
207 | + end | ||
208 | + | ||
209 | + densities = {} | ||
210 | + densities[:seed_seed] = seed_seed_sum.to_f / seed_seed_total.to_f | ||
211 | + densities[:seed_nonseed] = seed_nonseed_sum.to_f / seed_nonseed_total.to_f | ||
212 | + densities[:nonseed_seed] = nonseed_seed_sum.to_f / nonseed_seed_total.to_f | ||
213 | + densities[:nonseed_nonseed] = nonseed_nonseed_sum.to_f / nonseed_nonseed_total.to_f | ||
214 | + | ||
215 | + densities.each do |type, average| | ||
216 | + d = Density.new | ||
217 | + d.created_at = the_date | ||
218 | + d.question_id = q.id | ||
219 | + d.prompt_type = type.to_s | ||
220 | + d.value = average.nan? ? nil : average | ||
221 | + d.save! | ||
222 | + end | ||
223 | + | ||
224 | + puts "Seed_seed sum: #{seed_seed_sum}, seed_seed total num: #{seed_seed_total}" | ||
225 | + puts "Seed_nonseed sum: #{seed_nonseed_sum}, seed_nonseed total num: #{seed_nonseed_total}" | ||
226 | + puts "Nonseed_seed sum: #{nonseed_seed_sum}, nonseed_seed total num: #{nonseed_seed_total}" | ||
227 | + puts "Nonseed_nonseed sum: #{nonseed_nonseed_sum}, nonseed_nonseed total num: #{nonseed_nonseed_total}" | ||
228 | + | ||
229 | + | ||
230 | + end | ||
231 | + | ||
232 | + end | ||
233 | + | ||
234 | + end | ||
235 | + | ||
236 | + | ||
20 | desc "Invalidates votes with bad response times" | 237 | desc "Invalidates votes with bad response times" |
21 | task :invalidate_votes_with_bad_response_times => :environment do | 238 | task :invalidate_votes_with_bad_response_times => :environment do |
22 | badvotes = [] | 239 | badvotes = [] |
lib/tasks/test_api.rake
@@ -68,223 +68,6 @@ namespace :test_api do | @@ -68,223 +68,6 @@ namespace :test_api do | ||
68 | return error_message.blank? ? [success_message, false] : [error_message, true] | 68 | return error_message.blank? ? [success_message, false] : [error_message, true] |
69 | end | 69 | end |
70 | 70 | ||
71 | - desc "Don't run unless you know what you are doing" | ||
72 | - task(:generate_lots_of_votes => :environment) do | ||
73 | - if Rails.env.production? | ||
74 | - print "You probably don't want to run this in production as it will falsify a bunch of random votes" | ||
75 | - end | ||
76 | - | ||
77 | - | ||
78 | - current_user = User.first | ||
79 | - 1000.times do |n| | ||
80 | - puts "#{n} votes completed" if n % 100 == 0 | ||
81 | - question = Question.find(214) # test question change as needed | ||
82 | - @prompt = question.catchup_choose_prompt(1).first | ||
83 | - @appearance = current_user.record_appearance(current_user.default_visitor, @prompt) | ||
84 | - | ||
85 | - direction = (rand(2) == 0) ? "left" : "right" | ||
86 | - current_user.record_vote(:prompt => @prompt, :direction => direction, :appearance_lookup => @appearance.lookup) | ||
87 | - end | ||
88 | - | ||
89 | - end | ||
90 | - | ||
91 | - desc "Generate appearances for any votes that have no current appearance, should only need to be run once" | ||
92 | - task(:generate_appearances_for_existing_votes => :environment) do | ||
93 | - votes = Vote.all | ||
94 | - | ||
95 | - count = 0 | ||
96 | - votes.each do |v| | ||
97 | - if v.appearance.nil? | ||
98 | - print "." | ||
99 | - a = Appearance.create(:voter_id => v.voter_id, :site_id => v.site_id, :prompt_id => v.prompt_id, :question_id => v.question_id, :created_at => v.created_at, :updated_at => v.updated_at) | ||
100 | - v.appearance = a | ||
101 | - v.save | ||
102 | - | ||
103 | - count += 1 | ||
104 | - end | ||
105 | - end | ||
106 | - | ||
107 | - print count | ||
108 | - end | ||
109 | - | ||
110 | - | ||
111 | - desc "Generate past density information" | ||
112 | - task(:generate_past_densities => :environment) do | ||
113 | - #this is not elegant, but should only be run once, so quick and dirty wins | ||
114 | - | ||
115 | - start_date = Vote.find(:all, :conditions => 'loser_choice_id IS NOT NULL', :order => :created_at, :limit => 1).first.created_at.to_date | ||
116 | - start_date.upto(Date.today) do |the_date| | ||
117 | - questions = Question.find(:all, :conditions => ['created_at < ?', the_date]) | ||
118 | - | ||
119 | - print the_date.to_s | ||
120 | - questions.each do |q| | ||
121 | - puts q.id | ||
122 | - relevant_choices = q.choices.find(:all, :conditions => ['created_at < ?', the_date]) | ||
123 | - | ||
124 | - seed_choices = 0 | ||
125 | - | ||
126 | - if relevant_choices == 0 | ||
127 | - next | ||
128 | - #this question had not been created yet | ||
129 | - end | ||
130 | - | ||
131 | - relevant_choices.each do |c| | ||
132 | - if !c.user_created | ||
133 | - seed_choices+=1 | ||
134 | - end | ||
135 | - | ||
136 | - end | ||
137 | - | ||
138 | - nonseed_choices = relevant_choices.size - seed_choices | ||
139 | - | ||
140 | - seed_seed_total = seed_choices **2 - seed_choices | ||
141 | - nonseed_nonseed_total = nonseed_choices **2 - nonseed_choices | ||
142 | - seed_nonseed_total = seed_choices * nonseed_choices | ||
143 | - nonseed_seed_total = seed_choices * nonseed_choices | ||
144 | - | ||
145 | - seed_seed_sum = 0 | ||
146 | - seed_nonseed_sum= 0 | ||
147 | - nonseed_seed_sum= 0 | ||
148 | - nonseed_nonseed_sum= 0 | ||
149 | - | ||
150 | - q.appearances.find_each(:conditions => ['prompt_id IS NOT NULL AND created_at < ?', the_date]) do |a| | ||
151 | - | ||
152 | - p = a.prompt | ||
153 | - if p.left_choice.user_created == false && p.right_choice.user_created == false | ||
154 | - seed_seed_sum += 1 | ||
155 | - elsif p.left_choice.user_created == false && p.right_choice.user_created == true | ||
156 | - seed_nonseed_sum += 1 | ||
157 | - elsif p.left_choice.user_created == true && p.right_choice.user_created == false | ||
158 | - nonseed_seed_sum += 1 | ||
159 | - elsif p.left_choice.user_created == true && p.right_choice.user_created == true | ||
160 | - nonseed_nonseed_sum += 1 | ||
161 | - end | ||
162 | - end | ||
163 | - | ||
164 | - densities = {} | ||
165 | - densities[:seed_seed] = seed_seed_sum.to_f / seed_seed_total.to_f | ||
166 | - densities[:seed_nonseed] = seed_nonseed_sum.to_f / seed_nonseed_total.to_f | ||
167 | - densities[:nonseed_seed] = nonseed_seed_sum.to_f / nonseed_seed_total.to_f | ||
168 | - densities[:nonseed_nonseed] = nonseed_nonseed_sum.to_f / nonseed_nonseed_total.to_f | ||
169 | - | ||
170 | - densities.each do |type, average| | ||
171 | - d = Density.new | ||
172 | - d.created_at = the_date | ||
173 | - d.question_id = q.id | ||
174 | - d.prompt_type = type.to_s | ||
175 | - d.value = average.nan? ? nil : average | ||
176 | - d.save! | ||
177 | - end | ||
178 | - | ||
179 | - puts "Seed_seed sum: #{seed_seed_sum}, seed_seed total num: #{seed_seed_total}" | ||
180 | - puts "Seed_nonseed sum: #{seed_nonseed_sum}, seed_nonseed total num: #{seed_nonseed_total}" | ||
181 | - puts "Nonseed_seed sum: #{nonseed_seed_sum}, nonseed_seed total num: #{nonseed_seed_total}" | ||
182 | - puts "Nonseed_nonseed sum: #{nonseed_nonseed_sum}, nonseed_nonseed total num: #{nonseed_nonseed_total}" | ||
183 | - | ||
184 | - | ||
185 | - end | ||
186 | - | ||
187 | - end | ||
188 | - | ||
189 | - end | ||
190 | - | ||
191 | - | ||
192 | - desc "Should only need to be run once" | ||
193 | - task(:generate_all_possible_prompts => :environment) do | ||
194 | - Question.find(:all).each do |q| | ||
195 | - choices = q.choices | ||
196 | - if q.prompts.size > choices.size**2 - choices.size | ||
197 | - print "ERROR: #{q.id}\n" | ||
198 | - next | ||
199 | - elsif q.prompts.size == choices.size**2 - choices.size | ||
200 | - print "#{q.id} has enough prompts, skipping...\n" | ||
201 | - next | ||
202 | - else | ||
203 | - print "#{q.id} should add #{(choices.size ** 2 - choices.size) - q.prompts.size}\n" | ||
204 | - | ||
205 | - end | ||
206 | - created_timestring = q.created_at.to_s(:db) | ||
207 | - updated_timestring = Time.now.to_s(:db) #isn't rails awesome? | ||
208 | - promptscount=0 | ||
209 | - inserts = [] | ||
210 | - the_prompts = Prompt.find(:all, :select => 'id, left_choice_id, right_choice_id', :conditions => {:question_id => q.id}) | ||
211 | - | ||
212 | - the_prompts_hash = {} | ||
213 | - the_prompts.each do |p| | ||
214 | - the_prompts_hash["#{p.left_choice_id},#{p.right_choice_id}"] = 1 | ||
215 | - end | ||
216 | - | ||
217 | - choices.each do |l| | ||
218 | - choices.each do |r| | ||
219 | - if l.id == r.id | ||
220 | - next | ||
221 | - else | ||
222 | - #p = the_prompts.find{|o| o.left_choice_id == l.id && o.right_choice_id == r.id} | ||
223 | - keystring = "#{l.id},#{r.id}" | ||
224 | - p = the_prompts_hash[keystring] | ||
225 | - if p.nil? | ||
226 | - inserts.push("(NULL, #{q.id}, NULL, #{l.id}, '#{created_timestring}', '#{updated_timestring}', NULL, 0, #{r.id}, NULL, NULL)") | ||
227 | - promptscount+=1 | ||
228 | - end | ||
229 | - | ||
230 | - end | ||
231 | - | ||
232 | - end | ||
233 | - end | ||
234 | - | ||
235 | - print "Added #{promptscount} to #{q.id}\n" | ||
236 | - sql = "INSERT INTO `prompts` (`algorithm_id`, `question_id`, `voter_id`, `left_choice_id`, `created_at`, `updated_at`, `tracking`, `votes_count`, `right_choice_id`, `active`, `randomkey`) VALUES #{inserts.join(', ')}" | ||
237 | - unless inserts.empty? | ||
238 | - ActiveRecord::Base.connection.execute(sql) | ||
239 | - end | ||
240 | - | ||
241 | - Question.update_counters(q.id, :prompts_count => promptscount) | ||
242 | - | ||
243 | - | ||
244 | - end | ||
245 | - | ||
246 | - | ||
247 | - | ||
248 | - end | ||
249 | - | ||
250 | - | ||
251 | - desc "Dump votes of a question by left vs right id" | ||
252 | - task(:make_csv => :environment) do | ||
253 | - | ||
254 | - q = Question.find(214) | ||
255 | - | ||
256 | - | ||
257 | - the_prompts = q.prompts_hash_by_choice_ids | ||
258 | - | ||
259 | - #hash_of_choice_ids_from_left_to_right_to_votes | ||
260 | - the_hash = {} | ||
261 | - q.choices.each do |l| | ||
262 | - q.choices.each do |r| | ||
263 | - next if l.id == r.id | ||
264 | - | ||
265 | - if not the_hash.has_key?(l.id) | ||
266 | - the_hash[l.id] = {} | ||
267 | - the_hash[l.id][l.id] = 0 | ||
268 | - end | ||
269 | - | ||
270 | - p = the_prompts["#{l.id}, #{r.id}"] | ||
271 | - if p.nil? | ||
272 | - the_hash[l.id][r.id] = 0 | ||
273 | - else | ||
274 | - the_hash[l.id][r.id] = p.appearances.size | ||
275 | - end | ||
276 | - end | ||
277 | - end | ||
278 | - | ||
279 | - the_hash.sort.each do |xval, row| | ||
280 | - rowarray = [] | ||
281 | - row.sort.each do |yval, cell| | ||
282 | - rowarray << cell | ||
283 | - end | ||
284 | - puts rowarray.join(", ") | ||
285 | - end | ||
286 | - end | ||
287 | - | ||
288 | 71 | ||
289 | desc "Generate density information for each question - should be run nightly" | 72 | desc "Generate density information for each question - should be run nightly" |
290 | task(:generate_density_information => :environment) do | 73 | task(:generate_density_information => :environment) do |
@@ -663,8 +446,11 @@ namespace :test_api do | @@ -663,8 +446,11 @@ namespace :test_api do | ||
663 | 446 | ||
664 | desc "Ensure that a question has: answered_appearances == votes + skips" | 447 | desc "Ensure that a question has: answered_appearances == votes + skips" |
665 | task :answered_appearances_equals_votes_and_skips, [:question_id] => :environment do |t, args| | 448 | task :answered_appearances_equals_votes_and_skips, [:question_id] => :environment do |t, args| |
666 | - question = Question.find(args[:question_id]) | ||
667 | - puts answered_appearances_equals_votes_and_skips(question).inspect | 449 | + a = cleanup_args(args) |
450 | + questions = Question.find(a[:question_id]) | ||
451 | + questions.each do |question| | ||
452 | + puts answered_appearances_equals_votes_and_skips(question).inspect | ||
453 | + end | ||
668 | end | 454 | end |
669 | 455 | ||
670 | def answered_appearances_equals_votes_and_skips(question) | 456 | def answered_appearances_equals_votes_and_skips(question) |
@@ -726,3 +512,14 @@ namespace :test_api do | @@ -726,3 +512,14 @@ namespace :test_api do | ||
726 | end | 512 | end |
727 | end | 513 | end |
728 | 514 | ||
515 | +def cleanup_args(args) | ||
516 | + args.with_defaults(:question_id => :all, :choice_id => :all) | ||
517 | + a = args.to_hash | ||
518 | + if a[:question_id] != :all | ||
519 | + a[:question_id] = a[:question_id].split(".") | ||
520 | + end | ||
521 | + if a[:choice_id] != :all | ||
522 | + a[:choice_id] = a[:choice_id].split(".") | ||
523 | + end | ||
524 | + a | ||
525 | +end |