Merged updates from trunk into stable branch
[feedcatcher.git] / vendor / rails / activerecord / lib / active_record / calculations.rb
1 module ActiveRecord
2 module Calculations #:nodoc:
3 CALCULATIONS_OPTIONS = [:conditions, :joins, :order, :select, :group, :having, :distinct, :limit, :offset, :include, :from]
4 def self.included(base)
5 base.extend(ClassMethods)
6 end
7
8 module ClassMethods
9 # Count operates using three different approaches.
10 #
11 # * Count all: By not passing any parameters to count, it will return a count of all the rows for the model.
12 # * Count using column: By passing a column name to count, it will return a count of all the rows for the model with supplied column present
13 # * Count using options will find the row count matched by the options used.
14 #
15 # The third approach, count using options, accepts an option hash as the only parameter. The options are:
16 #
17 # * <tt>:conditions</tt>: An SQL fragment like "administrator = 1" or [ "user_name = ?", username ]. See conditions in the intro to ActiveRecord::Base.
18 # * <tt>:joins</tt>: Either an SQL fragment for additional joins like "LEFT JOIN comments ON comments.post_id = id" (rarely needed)
19 # or named associations in the same form used for the <tt>:include</tt> option, which will perform an INNER JOIN on the associated table(s).
20 # If the value is a string, then the records will be returned read-only since they will have attributes that do not correspond to the table's columns.
21 # Pass <tt>:readonly => false</tt> to override.
22 # * <tt>:include</tt>: Named associations that should be loaded alongside using LEFT OUTER JOINs. The symbols named refer
23 # to already defined associations. When using named associations, count returns the number of DISTINCT items for the model you're counting.
24 # See eager loading under Associations.
25 # * <tt>:order</tt>: An SQL fragment like "created_at DESC, name" (really only used with GROUP BY calculations).
26 # * <tt>:group</tt>: An attribute name by which the result should be grouped. Uses the GROUP BY SQL-clause.
27 # * <tt>:select</tt>: By default, this is * as in SELECT * FROM, but can be changed if you, for example, want to do a join but not
28 # include the joined columns.
29 # * <tt>:distinct</tt>: Set this to true to make this a distinct calculation, such as SELECT COUNT(DISTINCT posts.id) ...
30 # * <tt>:from</tt> - By default, this is the table name of the class, but can be changed to an alternate table name (or even the name
31 # of a database view).
32 #
33 # Examples for counting all:
34 # Person.count # returns the total count of all people
35 #
36 # Examples for counting by column:
37 # Person.count(:age) # returns the total count of all people whose age is present in database
38 #
39 # Examples for count with options:
40 # Person.count(:conditions => "age > 26")
41 # Person.count(:conditions => "age > 26 AND job.salary > 60000", :include => :job) # because of the named association, it finds the DISTINCT count using LEFT OUTER JOIN.
42 # Person.count(:conditions => "age > 26 AND job.salary > 60000", :joins => "LEFT JOIN jobs on jobs.person_id = person.id") # finds the number of rows matching the conditions and joins.
43 # Person.count('id', :conditions => "age > 26") # Performs a COUNT(id)
44 # Person.count(:all, :conditions => "age > 26") # Performs a COUNT(*) (:all is an alias for '*')
45 #
46 # Note: <tt>Person.count(:all)</tt> will not work because it will use <tt>:all</tt> as the condition. Use Person.count instead.
47 def count(*args)
48 calculate(:count, *construct_count_options_from_args(*args))
49 end
50
51 # Calculates the average value on a given column. The value is returned as
52 # a float, or +nil+ if there's no row. See +calculate+ for examples with
53 # options.
54 #
55 # Person.average('age') # => 35.8
56 def average(column_name, options = {})
57 calculate(:avg, column_name, options)
58 end
59
60 # Calculates the minimum value on a given column. The value is returned
61 # with the same data type of the column, or +nil+ if there's no row. See
62 # +calculate+ for examples with options.
63 #
64 # Person.minimum('age') # => 7
65 def minimum(column_name, options = {})
66 calculate(:min, column_name, options)
67 end
68
69 # Calculates the maximum value on a given column. The value is returned
70 # with the same data type of the column, or +nil+ if there's no row. See
71 # +calculate+ for examples with options.
72 #
73 # Person.maximum('age') # => 93
74 def maximum(column_name, options = {})
75 calculate(:max, column_name, options)
76 end
77
78 # Calculates the sum of values on a given column. The value is returned
79 # with the same data type of the column, 0 if there's no row. See
80 # +calculate+ for examples with options.
81 #
82 # Person.sum('age') # => 4562
83 def sum(column_name, options = {})
84 calculate(:sum, column_name, options)
85 end
86
87 # This calculates aggregate values in the given column. Methods for count, sum, average, minimum, and maximum have been added as shortcuts.
88 # Options such as <tt>:conditions</tt>, <tt>:order</tt>, <tt>:group</tt>, <tt>:having</tt>, and <tt>:joins</tt> can be passed to customize the query.
89 #
90 # There are two basic forms of output:
91 # * Single aggregate value: The single value is type cast to Fixnum for COUNT, Float for AVG, and the given column's type for everything else.
92 # * Grouped values: This returns an ordered hash of the values and groups them by the <tt>:group</tt> option. It takes either a column name, or the name
93 # of a belongs_to association.
94 #
95 # values = Person.maximum(:age, :group => 'last_name')
96 # puts values["Drake"]
97 # => 43
98 #
99 # drake = Family.find_by_last_name('Drake')
100 # values = Person.maximum(:age, :group => :family) # Person belongs_to :family
101 # puts values[drake]
102 # => 43
103 #
104 # values.each do |family, max_age|
105 # ...
106 # end
107 #
108 # Options:
109 # * <tt>:conditions</tt> - An SQL fragment like "administrator = 1" or [ "user_name = ?", username ]. See conditions in the intro to ActiveRecord::Base.
110 # * <tt>:include</tt>: Eager loading, see Associations for details. Since calculations don't load anything, the purpose of this is to access fields on joined tables in your conditions, order, or group clauses.
111 # * <tt>:joins</tt> - An SQL fragment for additional joins like "LEFT JOIN comments ON comments.post_id = id". (Rarely needed).
112 # The records will be returned read-only since they will have attributes that do not correspond to the table's columns.
113 # * <tt>:order</tt> - An SQL fragment like "created_at DESC, name" (really only used with GROUP BY calculations).
114 # * <tt>:group</tt> - An attribute name by which the result should be grouped. Uses the GROUP BY SQL-clause.
115 # * <tt>:select</tt> - By default, this is * as in SELECT * FROM, but can be changed if you for example want to do a join, but not
116 # include the joined columns.
117 # * <tt>:distinct</tt> - Set this to true to make this a distinct calculation, such as SELECT COUNT(DISTINCT posts.id) ...
118 #
119 # Examples:
120 # Person.calculate(:count, :all) # The same as Person.count
121 # Person.average(:age) # SELECT AVG(age) FROM people...
122 # Person.minimum(:age, :conditions => ['last_name != ?', 'Drake']) # Selects the minimum age for everyone with a last name other than 'Drake'
123 # Person.minimum(:age, :having => 'min(age) > 17', :group => :last_name) # Selects the minimum age for any family without any minors
124 # Person.sum("2 * age")
125 def calculate(operation, column_name, options = {})
126 validate_calculation_options(operation, options)
127 column_name = options[:select] if options[:select]
128 column_name = '*' if column_name == :all
129 column = column_for column_name
130 catch :invalid_query do
131 if options[:group]
132 return execute_grouped_calculation(operation, column_name, column, options)
133 else
134 return execute_simple_calculation(operation, column_name, column, options)
135 end
136 end
137 0
138 end
139
140 protected
141 def construct_count_options_from_args(*args)
142 options = {}
143 column_name = :all
144
145 # We need to handle
146 # count()
147 # count(:column_name=:all)
148 # count(options={})
149 # count(column_name=:all, options={})
150 # selects specified by scopes
151 case args.size
152 when 0
153 column_name = scope(:find)[:select] if scope(:find)
154 when 1
155 if args[0].is_a?(Hash)
156 column_name = scope(:find)[:select] if scope(:find)
157 options = args[0]
158 else
159 column_name = args[0]
160 end
161 when 2
162 column_name, options = args
163 else
164 raise ArgumentError, "Unexpected parameters passed to count(): #{args.inspect}"
165 end
166
167 [column_name || :all, options]
168 end
169
170 def construct_calculation_sql(operation, column_name, options) #:nodoc:
171 operation = operation.to_s.downcase
172 options = options.symbolize_keys
173
174 scope = scope(:find)
175 merged_includes = merge_includes(scope ? scope[:include] : [], options[:include])
176 aggregate_alias = column_alias_for(operation, column_name)
177 column_name = "#{connection.quote_table_name(table_name)}.#{column_name}" if column_names.include?(column_name.to_s)
178
179 if operation == 'count'
180 if merged_includes.any?
181 options[:distinct] = true
182 column_name = options[:select] || [connection.quote_table_name(table_name), primary_key] * '.'
183 end
184
185 if options[:distinct]
186 use_workaround = !connection.supports_count_distinct?
187 end
188 end
189
190 if options[:distinct] && column_name.to_s !~ /\s*DISTINCT\s+/i
191 distinct = 'DISTINCT '
192 end
193 sql = "SELECT #{operation}(#{distinct}#{column_name}) AS #{aggregate_alias}"
194
195 # A (slower) workaround if we're using a backend, like sqlite, that doesn't support COUNT DISTINCT.
196 sql = "SELECT COUNT(*) AS #{aggregate_alias}" if use_workaround
197
198 sql << ", #{options[:group_field]} AS #{options[:group_alias]}" if options[:group]
199 if options[:from]
200 sql << " FROM #{options[:from]} "
201 else
202 sql << " FROM (SELECT #{distinct}#{column_name}" if use_workaround
203 sql << " FROM #{connection.quote_table_name(table_name)} "
204 end
205
206 joins = ""
207 add_joins!(joins, options[:joins], scope)
208
209 if merged_includes.any?
210 join_dependency = ActiveRecord::Associations::ClassMethods::JoinDependency.new(self, merged_includes, joins)
211 sql << join_dependency.join_associations.collect{|join| join.association_join }.join
212 end
213
214 sql << joins unless joins.blank?
215
216 add_conditions!(sql, options[:conditions], scope)
217 add_limited_ids_condition!(sql, options, join_dependency) if join_dependency && !using_limitable_reflections?(join_dependency.reflections) && ((scope && scope[:limit]) || options[:limit])
218
219 if options[:group]
220 group_key = connection.adapter_name == 'FrontBase' ? :group_alias : :group_field
221 sql << " GROUP BY #{options[group_key]} "
222 end
223
224 if options[:group] && options[:having]
225 having = sanitize_sql_for_conditions(options[:having])
226
227 # FrontBase requires identifiers in the HAVING clause and chokes on function calls
228 if connection.adapter_name == 'FrontBase'
229 having.downcase!
230 having.gsub!(/#{operation}\s*\(\s*#{column_name}\s*\)/, aggregate_alias)
231 end
232
233 sql << " HAVING #{having} "
234 end
235
236 sql << " ORDER BY #{options[:order]} " if options[:order]
237 add_limit!(sql, options, scope)
238 sql << ") #{aggregate_alias}_subquery" if use_workaround
239 sql
240 end
241
242 def execute_simple_calculation(operation, column_name, column, options) #:nodoc:
243 value = connection.select_value(construct_calculation_sql(operation, column_name, options))
244 type_cast_calculated_value(value, column, operation)
245 end
246
247 def execute_grouped_calculation(operation, column_name, column, options) #:nodoc:
248 group_attr = options[:group].to_s
249 association = reflect_on_association(group_attr.to_sym)
250 associated = association && association.macro == :belongs_to # only count belongs_to associations
251 group_field = associated ? association.primary_key_name : group_attr
252 group_alias = column_alias_for(group_field)
253 group_column = column_for group_field
254 sql = construct_calculation_sql(operation, column_name, options.merge(:group_field => group_field, :group_alias => group_alias))
255 calculated_data = connection.select_all(sql)
256 aggregate_alias = column_alias_for(operation, column_name)
257
258 if association
259 key_ids = calculated_data.collect { |row| row[group_alias] }
260 key_records = association.klass.base_class.find(key_ids)
261 key_records = key_records.inject({}) { |hsh, r| hsh.merge(r.id => r) }
262 end
263
264 calculated_data.inject(ActiveSupport::OrderedHash.new) do |all, row|
265 key = type_cast_calculated_value(row[group_alias], group_column)
266 key = key_records[key] if associated
267 value = row[aggregate_alias]
268 all[key] = type_cast_calculated_value(value, column, operation)
269 all
270 end
271 end
272
273 private
274 def validate_calculation_options(operation, options = {})
275 options.assert_valid_keys(CALCULATIONS_OPTIONS)
276 end
277
278 # Converts the given keys to the value that the database adapter returns as
279 # a usable column name:
280 #
281 # column_alias_for("users.id") # => "users_id"
282 # column_alias_for("sum(id)") # => "sum_id"
283 # column_alias_for("count(distinct users.id)") # => "count_distinct_users_id"
284 # column_alias_for("count(*)") # => "count_all"
285 # column_alias_for("count", "id") # => "count_id"
286 def column_alias_for(*keys)
287 table_name = keys.join(' ')
288 table_name.downcase!
289 table_name.gsub!(/\*/, 'all')
290 table_name.gsub!(/\W+/, ' ')
291 table_name.strip!
292 table_name.gsub!(/ +/, '_')
293
294 connection.table_alias_for(table_name)
295 end
296
297 def column_for(field)
298 field_name = field.to_s.split('.').last
299 columns.detect { |c| c.name.to_s == field_name }
300 end
301
302 def type_cast_calculated_value(value, column, operation = nil)
303 operation = operation.to_s.downcase
304 case operation
305 when 'count' then value.to_i
306 when 'sum' then type_cast_using_column(value || '0', column)
307 when 'avg' then value && (value.is_a?(Fixnum) ? value.to_f : value).to_d
308 else type_cast_using_column(value, column)
309 end
310 end
311
312 def type_cast_using_column(value, column)
313 column ? column.type_cast(value) : value
314 end
315 end
316 end
317 end