1""" 2Extensions to Django's model logic. 3""" 4 5import django.core.exceptions 6from django.db import backend 7from django.db import connection 8from django.db import connections 9from django.db import models as dbmodels 10from django.db import transaction 11from django.db.models.sql import query 12import django.db.models.sql.where 13from django.utils import datastructures 14from autotest_lib.client.common_lib.cros.graphite import autotest_stats 15from autotest_lib.frontend.afe import rdb_model_extensions 16 17 18class ValidationError(django.core.exceptions.ValidationError): 19 """\ 20 Data validation error in adding or updating an object. The associated 21 value is a dictionary mapping field names to error strings. 22 """ 23 24def _quote_name(name): 25 """Shorthand for connection.ops.quote_name().""" 26 return connection.ops.quote_name(name) 27 28 29class LeasedHostManager(dbmodels.Manager): 30 """Query manager for unleased, unlocked hosts. 31 """ 32 def get_query_set(self): 33 return (super(LeasedHostManager, self).get_query_set().filter( 34 leased=0, locked=0)) 35 36 37class ExtendedManager(dbmodels.Manager): 38 """\ 39 Extended manager supporting subquery filtering. 40 """ 41 42 class CustomQuery(query.Query): 43 def __init__(self, *args, **kwargs): 44 super(ExtendedManager.CustomQuery, self).__init__(*args, **kwargs) 45 self._custom_joins = [] 46 47 48 def clone(self, klass=None, **kwargs): 49 obj = super(ExtendedManager.CustomQuery, self).clone(klass) 50 obj._custom_joins = list(self._custom_joins) 51 return obj 52 53 54 def combine(self, rhs, connector): 55 super(ExtendedManager.CustomQuery, self).combine(rhs, connector) 56 if hasattr(rhs, '_custom_joins'): 57 self._custom_joins.extend(rhs._custom_joins) 58 59 60 def add_custom_join(self, table, condition, join_type, 61 condition_values=(), alias=None): 62 if alias is None: 63 alias = table 64 join_dict = dict(table=table, 65 condition=condition, 66 condition_values=condition_values, 67 join_type=join_type, 68 alias=alias) 69 self._custom_joins.append(join_dict) 70 71 72 @classmethod 73 def convert_query(self, query_set): 74 """ 75 Convert the query set's "query" attribute to a CustomQuery. 76 """ 77 # Make a copy of the query set 78 query_set = query_set.all() 79 query_set.query = query_set.query.clone( 80 klass=ExtendedManager.CustomQuery, 81 _custom_joins=[]) 82 return query_set 83 84 85 class _WhereClause(object): 86 """Object allowing us to inject arbitrary SQL into Django queries. 87 88 By using this instead of extra(where=...), we can still freely combine 89 queries with & and |. 90 """ 91 def __init__(self, clause, values=()): 92 self._clause = clause 93 self._values = values 94 95 96 def as_sql(self, qn=None, connection=None): 97 return self._clause, self._values 98 99 100 def relabel_aliases(self, change_map): 101 return 102 103 104 def add_join(self, query_set, join_table, join_key, join_condition='', 105 join_condition_values=(), join_from_key=None, alias=None, 106 suffix='', exclude=False, force_left_join=False): 107 """Add a join to query_set. 108 109 Join looks like this: 110 (INNER|LEFT) JOIN <join_table> AS <alias> 111 ON (<this table>.<join_from_key> = <join_table>.<join_key> 112 and <join_condition>) 113 114 @param join_table table to join to 115 @param join_key field referencing back to this model to use for the join 116 @param join_condition extra condition for the ON clause of the join 117 @param join_condition_values values to substitute into join_condition 118 @param join_from_key column on this model to join from. 119 @param alias alias to use for for join 120 @param suffix suffix to add to join_table for the join alias, if no 121 alias is provided 122 @param exclude if true, exclude rows that match this join (will use a 123 LEFT OUTER JOIN and an appropriate WHERE condition) 124 @param force_left_join - if true, a LEFT OUTER JOIN will be used 125 instead of an INNER JOIN regardless of other options 126 """ 127 join_from_table = query_set.model._meta.db_table 128 if join_from_key is None: 129 join_from_key = self.model._meta.pk.name 130 if alias is None: 131 alias = join_table + suffix 132 full_join_key = _quote_name(alias) + '.' + _quote_name(join_key) 133 full_join_condition = '%s = %s.%s' % (full_join_key, 134 _quote_name(join_from_table), 135 _quote_name(join_from_key)) 136 if join_condition: 137 full_join_condition += ' AND (' + join_condition + ')' 138 if exclude or force_left_join: 139 join_type = query_set.query.LOUTER 140 else: 141 join_type = query_set.query.INNER 142 143 query_set = self.CustomQuery.convert_query(query_set) 144 query_set.query.add_custom_join(join_table, 145 full_join_condition, 146 join_type, 147 condition_values=join_condition_values, 148 alias=alias) 149 150 if exclude: 151 query_set = query_set.extra(where=[full_join_key + ' IS NULL']) 152 153 return query_set 154 155 156 def _info_for_many_to_one_join(self, field, join_to_query, alias): 157 """ 158 @param field: the ForeignKey field on the related model 159 @param join_to_query: the query over the related model that we're 160 joining to 161 @param alias: alias of joined table 162 """ 163 info = {} 164 rhs_table = join_to_query.model._meta.db_table 165 info['rhs_table'] = rhs_table 166 info['rhs_column'] = field.column 167 info['lhs_column'] = field.rel.get_related_field().column 168 rhs_where = join_to_query.query.where 169 rhs_where.relabel_aliases({rhs_table: alias}) 170 compiler = join_to_query.query.get_compiler(using=join_to_query.db) 171 initial_clause, values = compiler.as_sql() 172 all_clauses = (initial_clause,) 173 if hasattr(join_to_query.query, 'extra_where'): 174 all_clauses += join_to_query.query.extra_where 175 info['where_clause'] = ( 176 ' AND '.join('(%s)' % clause for clause in all_clauses)) 177 info['values'] = values 178 return info 179 180 181 def _info_for_many_to_many_join(self, m2m_field, join_to_query, alias, 182 m2m_is_on_this_model): 183 """ 184 @param m2m_field: a Django field representing the M2M relationship. 185 It uses a pivot table with the following structure: 186 this model table <---> M2M pivot table <---> joined model table 187 @param join_to_query: the query over the related model that we're 188 joining to. 189 @param alias: alias of joined table 190 """ 191 if m2m_is_on_this_model: 192 # referenced field on this model 193 lhs_id_field = self.model._meta.pk 194 # foreign key on the pivot table referencing lhs_id_field 195 m2m_lhs_column = m2m_field.m2m_column_name() 196 # foreign key on the pivot table referencing rhd_id_field 197 m2m_rhs_column = m2m_field.m2m_reverse_name() 198 # referenced field on related model 199 rhs_id_field = m2m_field.rel.get_related_field() 200 else: 201 lhs_id_field = m2m_field.rel.get_related_field() 202 m2m_lhs_column = m2m_field.m2m_reverse_name() 203 m2m_rhs_column = m2m_field.m2m_column_name() 204 rhs_id_field = join_to_query.model._meta.pk 205 206 info = {} 207 info['rhs_table'] = m2m_field.m2m_db_table() 208 info['rhs_column'] = m2m_lhs_column 209 info['lhs_column'] = lhs_id_field.column 210 211 # select the ID of related models relevant to this join. we can only do 212 # a single join, so we need to gather this information up front and 213 # include it in the join condition. 214 rhs_ids = join_to_query.values_list(rhs_id_field.attname, flat=True) 215 assert len(rhs_ids) == 1, ('Many-to-many custom field joins can only ' 216 'match a single related object.') 217 rhs_id = rhs_ids[0] 218 219 info['where_clause'] = '%s.%s = %s' % (_quote_name(alias), 220 _quote_name(m2m_rhs_column), 221 rhs_id) 222 info['values'] = () 223 return info 224 225 226 def join_custom_field(self, query_set, join_to_query, alias, 227 left_join=True): 228 """Join to a related model to create a custom field in the given query. 229 230 This method is used to construct a custom field on the given query based 231 on a many-valued relationsip. join_to_query should be a simple query 232 (no joins) on the related model which returns at most one related row 233 per instance of this model. 234 235 For many-to-one relationships, the joined table contains the matching 236 row from the related model it one is related, NULL otherwise. 237 238 For many-to-many relationships, the joined table contains the matching 239 row if it's related, NULL otherwise. 240 """ 241 relationship_type, field = self.determine_relationship( 242 join_to_query.model) 243 244 if relationship_type == self.MANY_TO_ONE: 245 info = self._info_for_many_to_one_join(field, join_to_query, alias) 246 elif relationship_type == self.M2M_ON_RELATED_MODEL: 247 info = self._info_for_many_to_many_join( 248 m2m_field=field, join_to_query=join_to_query, alias=alias, 249 m2m_is_on_this_model=False) 250 elif relationship_type ==self.M2M_ON_THIS_MODEL: 251 info = self._info_for_many_to_many_join( 252 m2m_field=field, join_to_query=join_to_query, alias=alias, 253 m2m_is_on_this_model=True) 254 255 return self.add_join(query_set, info['rhs_table'], info['rhs_column'], 256 join_from_key=info['lhs_column'], 257 join_condition=info['where_clause'], 258 join_condition_values=info['values'], 259 alias=alias, 260 force_left_join=left_join) 261 262 263 def key_on_joined_table(self, join_to_query): 264 """Get a non-null column on the table joined for the given query. 265 266 This analyzes the join that would be produced if join_to_query were 267 passed to join_custom_field. 268 """ 269 relationship_type, field = self.determine_relationship( 270 join_to_query.model) 271 if relationship_type == self.MANY_TO_ONE: 272 return join_to_query.model._meta.pk.column 273 return field.m2m_column_name() # any column on the M2M table will do 274 275 276 def add_where(self, query_set, where, values=()): 277 query_set = query_set.all() 278 query_set.query.where.add(self._WhereClause(where, values), 279 django.db.models.sql.where.AND) 280 return query_set 281 282 283 def _get_quoted_field(self, table, field): 284 return _quote_name(table) + '.' + _quote_name(field) 285 286 287 def get_key_on_this_table(self, key_field=None): 288 if key_field is None: 289 # default to primary key 290 key_field = self.model._meta.pk.column 291 return self._get_quoted_field(self.model._meta.db_table, key_field) 292 293 294 def escape_user_sql(self, sql): 295 return sql.replace('%', '%%') 296 297 298 def _custom_select_query(self, query_set, selects): 299 """Execute a custom select query. 300 301 @param query_set: query set as returned by query_objects. 302 @param selects: Tables/Columns to select, e.g. tko_test_labels_list.id. 303 304 @returns: Result of the query as returned by cursor.fetchall(). 305 """ 306 compiler = query_set.query.get_compiler(using=query_set.db) 307 sql, params = compiler.as_sql() 308 from_ = sql[sql.find(' FROM'):] 309 310 if query_set.query.distinct: 311 distinct = 'DISTINCT ' 312 else: 313 distinct = '' 314 315 sql_query = ('SELECT ' + distinct + ','.join(selects) + from_) 316 # Chose the connection that's responsible for this type of object 317 cursor = connections[query_set.db].cursor() 318 cursor.execute(sql_query, params) 319 return cursor.fetchall() 320 321 322 def _is_relation_to(self, field, model_class): 323 return field.rel and field.rel.to is model_class 324 325 326 MANY_TO_ONE = object() 327 M2M_ON_RELATED_MODEL = object() 328 M2M_ON_THIS_MODEL = object() 329 330 def determine_relationship(self, related_model): 331 """ 332 Determine the relationship between this model and related_model. 333 334 related_model must have some sort of many-valued relationship to this 335 manager's model. 336 @returns (relationship_type, field), where relationship_type is one of 337 MANY_TO_ONE, M2M_ON_RELATED_MODEL, M2M_ON_THIS_MODEL, and field 338 is the Django field object for the relationship. 339 """ 340 # look for a foreign key field on related_model relating to this model 341 for field in related_model._meta.fields: 342 if self._is_relation_to(field, self.model): 343 return self.MANY_TO_ONE, field 344 345 # look for an M2M field on related_model relating to this model 346 for field in related_model._meta.many_to_many: 347 if self._is_relation_to(field, self.model): 348 return self.M2M_ON_RELATED_MODEL, field 349 350 # maybe this model has the many-to-many field 351 for field in self.model._meta.many_to_many: 352 if self._is_relation_to(field, related_model): 353 return self.M2M_ON_THIS_MODEL, field 354 355 raise ValueError('%s has no relation to %s' % 356 (related_model, self.model)) 357 358 359 def _get_pivot_iterator(self, base_objects_by_id, related_model): 360 """ 361 Determine the relationship between this model and related_model, and 362 return a pivot iterator. 363 @param base_objects_by_id: dict of instances of this model indexed by 364 their IDs 365 @returns a pivot iterator, which yields a tuple (base_object, 366 related_object) for each relationship between a base object and a 367 related object. all base_object instances come from base_objects_by_id. 368 Note -- this depends on Django model internals. 369 """ 370 relationship_type, field = self.determine_relationship(related_model) 371 if relationship_type == self.MANY_TO_ONE: 372 return self._many_to_one_pivot(base_objects_by_id, 373 related_model, field) 374 elif relationship_type == self.M2M_ON_RELATED_MODEL: 375 return self._many_to_many_pivot( 376 base_objects_by_id, related_model, field.m2m_db_table(), 377 field.m2m_reverse_name(), field.m2m_column_name()) 378 else: 379 assert relationship_type == self.M2M_ON_THIS_MODEL 380 return self._many_to_many_pivot( 381 base_objects_by_id, related_model, field.m2m_db_table(), 382 field.m2m_column_name(), field.m2m_reverse_name()) 383 384 385 def _many_to_one_pivot(self, base_objects_by_id, related_model, 386 foreign_key_field): 387 """ 388 @returns a pivot iterator - see _get_pivot_iterator() 389 """ 390 filter_data = {foreign_key_field.name + '__pk__in': 391 base_objects_by_id.keys()} 392 for related_object in related_model.objects.filter(**filter_data): 393 # lookup base object in the dict, rather than grabbing it from the 394 # related object. we need to return instances from the dict, not 395 # fresh instances of the same models (and grabbing model instances 396 # from the related models incurs a DB query each time). 397 base_object_id = getattr(related_object, foreign_key_field.attname) 398 base_object = base_objects_by_id[base_object_id] 399 yield base_object, related_object 400 401 402 def _query_pivot_table(self, base_objects_by_id, pivot_table, 403 pivot_from_field, pivot_to_field, related_model): 404 """ 405 @param id_list list of IDs of self.model objects to include 406 @param pivot_table the name of the pivot table 407 @param pivot_from_field a field name on pivot_table referencing 408 self.model 409 @param pivot_to_field a field name on pivot_table referencing the 410 related model. 411 @param related_model the related model 412 413 @returns pivot list of IDs (base_id, related_id) 414 """ 415 query = """ 416 SELECT %(from_field)s, %(to_field)s 417 FROM %(table)s 418 WHERE %(from_field)s IN (%(id_list)s) 419 """ % dict(from_field=pivot_from_field, 420 to_field=pivot_to_field, 421 table=pivot_table, 422 id_list=','.join(str(id_) for id_ 423 in base_objects_by_id.iterkeys())) 424 425 # Chose the connection that's responsible for this type of object 426 # The databases for related_model and the current model will always 427 # be the same, related_model is just easier to obtain here because 428 # self is only a ExtendedManager, not the object. 429 cursor = connections[related_model.objects.db].cursor() 430 cursor.execute(query) 431 return cursor.fetchall() 432 433 434 def _many_to_many_pivot(self, base_objects_by_id, related_model, 435 pivot_table, pivot_from_field, pivot_to_field): 436 """ 437 @param pivot_table: see _query_pivot_table 438 @param pivot_from_field: see _query_pivot_table 439 @param pivot_to_field: see _query_pivot_table 440 @returns a pivot iterator - see _get_pivot_iterator() 441 """ 442 id_pivot = self._query_pivot_table(base_objects_by_id, pivot_table, 443 pivot_from_field, pivot_to_field, 444 related_model) 445 446 all_related_ids = list(set(related_id for base_id, related_id 447 in id_pivot)) 448 related_objects_by_id = related_model.objects.in_bulk(all_related_ids) 449 450 for base_id, related_id in id_pivot: 451 yield base_objects_by_id[base_id], related_objects_by_id[related_id] 452 453 454 def populate_relationships(self, base_objects, related_model, 455 related_list_name): 456 """ 457 For each instance of this model in base_objects, add a field named 458 related_list_name listing all the related objects of type related_model. 459 related_model must be in a many-to-one or many-to-many relationship with 460 this model. 461 @param base_objects - list of instances of this model 462 @param related_model - model class related to this model 463 @param related_list_name - attribute name in which to store the related 464 object list. 465 """ 466 if not base_objects: 467 # if we don't bail early, we'll get a SQL error later 468 return 469 470 base_objects_by_id = dict((base_object._get_pk_val(), base_object) 471 for base_object in base_objects) 472 pivot_iterator = self._get_pivot_iterator(base_objects_by_id, 473 related_model) 474 475 for base_object in base_objects: 476 setattr(base_object, related_list_name, []) 477 478 for base_object, related_object in pivot_iterator: 479 getattr(base_object, related_list_name).append(related_object) 480 481 482class ModelWithInvalidQuerySet(dbmodels.query.QuerySet): 483 """ 484 QuerySet that handles delete() properly for models with an "invalid" bit 485 """ 486 def delete(self): 487 for model in self: 488 model.delete() 489 490 491class ModelWithInvalidManager(ExtendedManager): 492 """ 493 Manager for objects with an "invalid" bit 494 """ 495 def get_query_set(self): 496 return ModelWithInvalidQuerySet(self.model) 497 498 499class ValidObjectsManager(ModelWithInvalidManager): 500 """ 501 Manager returning only objects with invalid=False. 502 """ 503 def get_query_set(self): 504 queryset = super(ValidObjectsManager, self).get_query_set() 505 return queryset.filter(invalid=False) 506 507 508class ModelExtensions(rdb_model_extensions.ModelValidators): 509 """\ 510 Mixin with convenience functions for models, built on top of 511 the model validators in rdb_model_extensions. 512 """ 513 # TODO: at least some of these functions really belong in a custom 514 # Manager class 515 516 517 SERIALIZATION_LINKS_TO_FOLLOW = set() 518 """ 519 To be able to send jobs and hosts to shards, it's necessary to find their 520 dependencies. 521 The most generic approach for this would be to traverse all relationships 522 to other objects recursively. This would list all objects that are related 523 in any way. 524 But this approach finds too many objects: If a host should be transferred, 525 all it's relationships would be traversed. This would find an acl group. 526 If then the acl group's relationships are traversed, the relationship 527 would be followed backwards and many other hosts would be found. 528 529 This mapping tells that algorithm which relations to follow explicitly. 530 """ 531 532 533 SERIALIZATION_LINKS_TO_KEEP = set() 534 """This set stores foreign keys which we don't want to follow, but 535 still want to include in the serialized dictionary. For 536 example, we follow the relationship `Host.hostattribute_set`, 537 but we do not want to follow `HostAttributes.host_id` back to 538 to Host, which would otherwise lead to a circle. However, we still 539 like to serialize HostAttribute.`host_id`.""" 540 541 SERIALIZATION_LOCAL_LINKS_TO_UPDATE = set() 542 """ 543 On deserializion, if the object to persist already exists, local fields 544 will only be updated, if their name is in this set. 545 """ 546 547 548 @classmethod 549 def convert_human_readable_values(cls, data, to_human_readable=False): 550 """\ 551 Performs conversions on user-supplied field data, to make it 552 easier for users to pass human-readable data. 553 554 For all fields that have choice sets, convert their values 555 from human-readable strings to enum values, if necessary. This 556 allows users to pass strings instead of the corresponding 557 integer values. 558 559 For all foreign key fields, call smart_get with the supplied 560 data. This allows the user to pass either an ID value or 561 the name of the object as a string. 562 563 If to_human_readable=True, perform the inverse - i.e. convert 564 numeric values to human readable values. 565 566 This method modifies data in-place. 567 """ 568 field_dict = cls.get_field_dict() 569 for field_name in data: 570 if field_name not in field_dict or data[field_name] is None: 571 continue 572 field_obj = field_dict[field_name] 573 # convert enum values 574 if field_obj.choices: 575 for choice_data in field_obj.choices: 576 # choice_data is (value, name) 577 if to_human_readable: 578 from_val, to_val = choice_data 579 else: 580 to_val, from_val = choice_data 581 if from_val == data[field_name]: 582 data[field_name] = to_val 583 break 584 # convert foreign key values 585 elif field_obj.rel: 586 dest_obj = field_obj.rel.to.smart_get(data[field_name], 587 valid_only=False) 588 if to_human_readable: 589 # parameterized_jobs do not have a name_field 590 if (field_name != 'parameterized_job' and 591 dest_obj.name_field is not None): 592 data[field_name] = getattr(dest_obj, 593 dest_obj.name_field) 594 else: 595 data[field_name] = dest_obj 596 597 598 599 600 def _validate_unique(self): 601 """\ 602 Validate that unique fields are unique. Django manipulators do 603 this too, but they're a huge pain to use manually. Trust me. 604 """ 605 errors = {} 606 cls = type(self) 607 field_dict = self.get_field_dict() 608 manager = cls.get_valid_manager() 609 for field_name, field_obj in field_dict.iteritems(): 610 if not field_obj.unique: 611 continue 612 613 value = getattr(self, field_name) 614 if value is None and field_obj.auto_created: 615 # don't bother checking autoincrement fields about to be 616 # generated 617 continue 618 619 existing_objs = manager.filter(**{field_name : value}) 620 num_existing = existing_objs.count() 621 622 if num_existing == 0: 623 continue 624 if num_existing == 1 and existing_objs[0].id == self.id: 625 continue 626 errors[field_name] = ( 627 'This value must be unique (%s)' % (value)) 628 return errors 629 630 631 def _validate(self): 632 """ 633 First coerces all fields on this instance to their proper Python types. 634 Then runs validation on every field. Returns a dictionary of 635 field_name -> error_list. 636 637 Based on validate() from django.db.models.Model in Django 0.96, which 638 was removed in Django 1.0. It should reappear in a later version. See: 639 http://code.djangoproject.com/ticket/6845 640 """ 641 error_dict = {} 642 for f in self._meta.fields: 643 try: 644 python_value = f.to_python( 645 getattr(self, f.attname, f.get_default())) 646 except django.core.exceptions.ValidationError, e: 647 error_dict[f.name] = str(e) 648 continue 649 650 if not f.blank and not python_value: 651 error_dict[f.name] = 'This field is required.' 652 continue 653 654 setattr(self, f.attname, python_value) 655 656 return error_dict 657 658 659 def do_validate(self): 660 errors = self._validate() 661 unique_errors = self._validate_unique() 662 for field_name, error in unique_errors.iteritems(): 663 errors.setdefault(field_name, error) 664 if errors: 665 raise ValidationError(errors) 666 667 668 # actually (externally) useful methods follow 669 670 @classmethod 671 def add_object(cls, data={}, **kwargs): 672 """\ 673 Returns a new object created with the given data (a dictionary 674 mapping field names to values). Merges any extra keyword args 675 into data. 676 """ 677 data = dict(data) 678 data.update(kwargs) 679 data = cls.prepare_data_args(data) 680 cls.convert_human_readable_values(data) 681 data = cls.provide_default_values(data) 682 683 obj = cls(**data) 684 obj.do_validate() 685 obj.save() 686 return obj 687 688 689 def update_object(self, data={}, **kwargs): 690 """\ 691 Updates the object with the given data (a dictionary mapping 692 field names to values). Merges any extra keyword args into 693 data. 694 """ 695 data = dict(data) 696 data.update(kwargs) 697 data = self.prepare_data_args(data) 698 self.convert_human_readable_values(data) 699 for field_name, value in data.iteritems(): 700 setattr(self, field_name, value) 701 self.do_validate() 702 self.save() 703 704 705 # see query_objects() 706 _SPECIAL_FILTER_KEYS = ('query_start', 'query_limit', 'sort_by', 707 'extra_args', 'extra_where', 'no_distinct') 708 709 710 @classmethod 711 def _extract_special_params(cls, filter_data): 712 """ 713 @returns a tuple of dicts (special_params, regular_filters), where 714 special_params contains the parameters we handle specially and 715 regular_filters is the remaining data to be handled by Django. 716 """ 717 regular_filters = dict(filter_data) 718 special_params = {} 719 for key in cls._SPECIAL_FILTER_KEYS: 720 if key in regular_filters: 721 special_params[key] = regular_filters.pop(key) 722 return special_params, regular_filters 723 724 725 @classmethod 726 def apply_presentation(cls, query, filter_data): 727 """ 728 Apply presentation parameters -- sorting and paging -- to the given 729 query. 730 @returns new query with presentation applied 731 """ 732 special_params, _ = cls._extract_special_params(filter_data) 733 sort_by = special_params.get('sort_by', None) 734 if sort_by: 735 assert isinstance(sort_by, list) or isinstance(sort_by, tuple) 736 query = query.extra(order_by=sort_by) 737 738 query_start = special_params.get('query_start', None) 739 query_limit = special_params.get('query_limit', None) 740 if query_start is not None: 741 if query_limit is None: 742 raise ValueError('Cannot pass query_start without query_limit') 743 # query_limit is passed as a page size 744 query_limit += query_start 745 return query[query_start:query_limit] 746 747 748 @classmethod 749 def query_objects(cls, filter_data, valid_only=True, initial_query=None, 750 apply_presentation=True): 751 """\ 752 Returns a QuerySet object for querying the given model_class 753 with the given filter_data. Optional special arguments in 754 filter_data include: 755 -query_start: index of first return to return 756 -query_limit: maximum number of results to return 757 -sort_by: list of fields to sort on. prefixing a '-' onto a 758 field name changes the sort to descending order. 759 -extra_args: keyword args to pass to query.extra() (see Django 760 DB layer documentation) 761 -extra_where: extra WHERE clause to append 762 -no_distinct: if True, a DISTINCT will not be added to the SELECT 763 """ 764 special_params, regular_filters = cls._extract_special_params( 765 filter_data) 766 767 if initial_query is None: 768 if valid_only: 769 initial_query = cls.get_valid_manager() 770 else: 771 initial_query = cls.objects 772 773 query = initial_query.filter(**regular_filters) 774 775 use_distinct = not special_params.get('no_distinct', False) 776 if use_distinct: 777 query = query.distinct() 778 779 extra_args = special_params.get('extra_args', {}) 780 extra_where = special_params.get('extra_where', None) 781 if extra_where: 782 # escape %'s 783 extra_where = cls.objects.escape_user_sql(extra_where) 784 extra_args.setdefault('where', []).append(extra_where) 785 if extra_args: 786 query = query.extra(**extra_args) 787 # TODO: Use readonly connection for these queries. 788 # This has been disabled, because it's not used anyway, as the 789 # configured readonly user is the same as the real user anyway. 790 791 if apply_presentation: 792 query = cls.apply_presentation(query, filter_data) 793 794 return query 795 796 797 @classmethod 798 def query_count(cls, filter_data, initial_query=None): 799 """\ 800 Like query_objects, but retreive only the count of results. 801 """ 802 filter_data.pop('query_start', None) 803 filter_data.pop('query_limit', None) 804 query = cls.query_objects(filter_data, initial_query=initial_query) 805 return query.count() 806 807 808 @classmethod 809 def clean_object_dicts(cls, field_dicts): 810 """\ 811 Take a list of dicts corresponding to object (as returned by 812 query.values()) and clean the data to be more suitable for 813 returning to the user. 814 """ 815 for field_dict in field_dicts: 816 cls.clean_foreign_keys(field_dict) 817 cls._convert_booleans(field_dict) 818 cls.convert_human_readable_values(field_dict, 819 to_human_readable=True) 820 821 822 @classmethod 823 def list_objects(cls, filter_data, initial_query=None): 824 """\ 825 Like query_objects, but return a list of dictionaries. 826 """ 827 query = cls.query_objects(filter_data, initial_query=initial_query) 828 extra_fields = query.query.extra_select.keys() 829 field_dicts = [model_object.get_object_dict(extra_fields=extra_fields) 830 for model_object in query] 831 return field_dicts 832 833 834 @classmethod 835 def smart_get(cls, id_or_name, valid_only=True): 836 """\ 837 smart_get(integer) -> get object by ID 838 smart_get(string) -> get object by name_field 839 """ 840 if valid_only: 841 manager = cls.get_valid_manager() 842 else: 843 manager = cls.objects 844 845 if isinstance(id_or_name, (int, long)): 846 return manager.get(pk=id_or_name) 847 if isinstance(id_or_name, basestring) and hasattr(cls, 'name_field'): 848 return manager.get(**{cls.name_field : id_or_name}) 849 raise ValueError( 850 'Invalid positional argument: %s (%s)' % (id_or_name, 851 type(id_or_name))) 852 853 854 @classmethod 855 def smart_get_bulk(cls, id_or_name_list): 856 invalid_inputs = [] 857 result_objects = [] 858 for id_or_name in id_or_name_list: 859 try: 860 result_objects.append(cls.smart_get(id_or_name)) 861 except cls.DoesNotExist: 862 invalid_inputs.append(id_or_name) 863 if invalid_inputs: 864 raise cls.DoesNotExist('The following %ss do not exist: %s' 865 % (cls.__name__.lower(), 866 ', '.join(invalid_inputs))) 867 return result_objects 868 869 870 def get_object_dict(self, extra_fields=None): 871 """\ 872 Return a dictionary mapping fields to this object's values. @param 873 extra_fields: list of extra attribute names to include, in addition to 874 the fields defined on this object. 875 """ 876 fields = self.get_field_dict().keys() 877 if extra_fields: 878 fields += extra_fields 879 object_dict = dict((field_name, getattr(self, field_name)) 880 for field_name in fields) 881 self.clean_object_dicts([object_dict]) 882 self._postprocess_object_dict(object_dict) 883 return object_dict 884 885 886 def _postprocess_object_dict(self, object_dict): 887 """For subclasses to override.""" 888 pass 889 890 891 @classmethod 892 def get_valid_manager(cls): 893 return cls.objects 894 895 896 def _record_attributes(self, attributes): 897 """ 898 See on_attribute_changed. 899 """ 900 assert not isinstance(attributes, basestring) 901 self._recorded_attributes = dict((attribute, getattr(self, attribute)) 902 for attribute in attributes) 903 904 905 def _check_for_updated_attributes(self): 906 """ 907 See on_attribute_changed. 908 """ 909 for attribute, original_value in self._recorded_attributes.iteritems(): 910 new_value = getattr(self, attribute) 911 if original_value != new_value: 912 self.on_attribute_changed(attribute, original_value) 913 self._record_attributes(self._recorded_attributes.keys()) 914 915 916 def on_attribute_changed(self, attribute, old_value): 917 """ 918 Called whenever an attribute is updated. To be overridden. 919 920 To use this method, you must: 921 * call _record_attributes() from __init__() (after making the super 922 call) with a list of attributes for which you want to be notified upon 923 change. 924 * call _check_for_updated_attributes() from save(). 925 """ 926 pass 927 928 929 def serialize(self, include_dependencies=True): 930 """Serializes the object with dependencies. 931 932 The variable SERIALIZATION_LINKS_TO_FOLLOW defines which dependencies 933 this function will serialize with the object. 934 935 @param include_dependencies: Whether or not to follow relations to 936 objects this object depends on. 937 This parameter is used when uploading 938 jobs from a shard to the master, as the 939 master already has all the dependent 940 objects. 941 942 @returns: Dictionary representation of the object. 943 """ 944 serialized = {} 945 timer = autotest_stats.Timer('serialize_latency.%s' % ( 946 type(self).__name__)) 947 with timer.get_client('local'): 948 for field in self._meta.concrete_model._meta.local_fields: 949 if field.rel is None: 950 serialized[field.name] = field._get_val_from_obj(self) 951 elif field.name in self.SERIALIZATION_LINKS_TO_KEEP: 952 # attname will contain "_id" suffix for foreign keys, 953 # e.g. HostAttribute.host will be serialized as 'host_id'. 954 # Use it for easy deserialization. 955 serialized[field.attname] = field._get_val_from_obj(self) 956 957 if include_dependencies: 958 with timer.get_client('related'): 959 for link in self.SERIALIZATION_LINKS_TO_FOLLOW: 960 serialized[link] = self._serialize_relation(link) 961 962 return serialized 963 964 965 def _serialize_relation(self, link): 966 """Serializes dependent objects given the name of the relation. 967 968 @param link: Name of the relation to take objects from. 969 970 @returns For To-Many relationships a list of the serialized related 971 objects, for To-One relationships the serialized related object. 972 """ 973 try: 974 attr = getattr(self, link) 975 except AttributeError: 976 # One-To-One relationships that point to None may raise this 977 return None 978 979 if attr is None: 980 return None 981 if hasattr(attr, 'all'): 982 return [obj.serialize() for obj in attr.all()] 983 return attr.serialize() 984 985 986 @classmethod 987 def _split_local_from_foreign_values(cls, data): 988 """This splits local from foreign values in a serialized object. 989 990 @param data: The serialized object. 991 992 @returns A tuple of two lists, both containing tuples in the form 993 (link_name, link_value). The first list contains all links 994 for local fields, the second one contains those for foreign 995 fields/objects. 996 """ 997 links_to_local_values, links_to_related_values = [], [] 998 for link, value in data.iteritems(): 999 if link in cls.SERIALIZATION_LINKS_TO_FOLLOW: 1000 # It's a foreign key 1001 links_to_related_values.append((link, value)) 1002 else: 1003 # It's a local attribute or a foreign key 1004 # we don't want to follow. 1005 links_to_local_values.append((link, value)) 1006 return links_to_local_values, links_to_related_values 1007 1008 1009 @classmethod 1010 def _filter_update_allowed_fields(cls, data): 1011 """Filters data and returns only files that updates are allowed on. 1012 1013 This is i.e. needed for syncing aborted bits from the master to shards. 1014 1015 Local links are only allowed to be updated, if they are in 1016 SERIALIZATION_LOCAL_LINKS_TO_UPDATE. 1017 Overwriting existing values is allowed in order to be able to sync i.e. 1018 the aborted bit from the master to a shard. 1019 1020 The whitelisting mechanism is in place to prevent overwriting local 1021 status: If all fields were overwritten, jobs would be completely be 1022 set back to their original (unstarted) state. 1023 1024 @param data: List with tuples of the form (link_name, link_value), as 1025 returned by _split_local_from_foreign_values. 1026 1027 @returns List of the same format as data, but only containing data for 1028 fields that updates are allowed on. 1029 """ 1030 return [pair for pair in data 1031 if pair[0] in cls.SERIALIZATION_LOCAL_LINKS_TO_UPDATE] 1032 1033 1034 @classmethod 1035 def delete_matching_record(cls, **filter_args): 1036 """Delete records matching the filter. 1037 1038 @param filter_args: Arguments for the django filter 1039 used to locate the record to delete. 1040 """ 1041 try: 1042 existing_record = cls.objects.get(**filter_args) 1043 except cls.DoesNotExist: 1044 return 1045 existing_record.delete() 1046 1047 1048 def _deserialize_local(self, data): 1049 """Set local attributes from a list of tuples. 1050 1051 @param data: List of tuples like returned by 1052 _split_local_from_foreign_values. 1053 """ 1054 if not data: 1055 return 1056 1057 for link, value in data: 1058 setattr(self, link, value) 1059 # Overwridden save() methods are prone to errors, so don't execute them. 1060 # This is because: 1061 # - the overwritten methods depend on ACL groups that don't yet exist 1062 # and don't handle errors 1063 # - the overwritten methods think this object already exists in the db 1064 # because the id is already set 1065 super(type(self), self).save() 1066 1067 1068 def _deserialize_relations(self, data): 1069 """Set foreign attributes from a list of tuples. 1070 1071 This deserialized the related objects using their own deserialize() 1072 function and then sets the relation. 1073 1074 @param data: List of tuples like returned by 1075 _split_local_from_foreign_values. 1076 """ 1077 for link, value in data: 1078 self._deserialize_relation(link, value) 1079 # See comment in _deserialize_local 1080 super(type(self), self).save() 1081 1082 1083 @classmethod 1084 def get_record(cls, data): 1085 """Retrieve a record with the data in the given input arg. 1086 1087 @param data: A dictionary containing the information to use in a query 1088 for data. If child models have different constraints of 1089 uniqueness they should override this model. 1090 1091 @return: An object with matching data. 1092 1093 @raises DoesNotExist: If a record with the given data doesn't exist. 1094 """ 1095 return cls.objects.get(id=data['id']) 1096 1097 1098 @classmethod 1099 def deserialize(cls, data): 1100 """Recursively deserializes and saves an object with it's dependencies. 1101 1102 This takes the result of the serialize method and creates objects 1103 in the database that are just like the original. 1104 1105 If an object of the same type with the same id already exists, it's 1106 local values will be left untouched, unless they are explicitly 1107 whitelisted in SERIALIZATION_LOCAL_LINKS_TO_UPDATE. 1108 1109 Deserialize will always recursively propagate to all related objects 1110 present in data though. 1111 I.e. this is necessary to add users to an already existing acl-group. 1112 1113 @param data: Representation of an object and its dependencies, as 1114 returned by serialize. 1115 1116 @returns: The object represented by data if it didn't exist before, 1117 otherwise the object that existed before and has the same type 1118 and id as the one described by data. 1119 """ 1120 if data is None: 1121 return None 1122 1123 local, related = cls._split_local_from_foreign_values(data) 1124 try: 1125 instance = cls.get_record(data) 1126 local = cls._filter_update_allowed_fields(local) 1127 except cls.DoesNotExist: 1128 instance = cls() 1129 1130 timer = autotest_stats.Timer('deserialize_latency.%s' % ( 1131 type(instance).__name__)) 1132 with timer.get_client('local'): 1133 instance._deserialize_local(local) 1134 with timer.get_client('related'): 1135 instance._deserialize_relations(related) 1136 1137 return instance 1138 1139 1140 def sanity_check_update_from_shard(self, shard, updated_serialized, 1141 *args, **kwargs): 1142 """Check if an update sent from a shard is legitimate. 1143 1144 @raises error.UnallowedRecordsSentToMaster if an update is not 1145 legitimate. 1146 """ 1147 raise NotImplementedError( 1148 'sanity_check_update_from_shard must be implemented by subclass %s ' 1149 'for type %s' % type(self)) 1150 1151 1152 @transaction.commit_on_success 1153 def update_from_serialized(self, serialized): 1154 """Updates local fields of an existing object from a serialized form. 1155 1156 This is different than the normal deserialize() in the way that it 1157 does update local values, which deserialize doesn't, but doesn't 1158 recursively propagate to related objects, which deserialize() does. 1159 1160 The use case of this function is to update job records on the master 1161 after the jobs have been executed on a slave, as the master is not 1162 interested in updates for users, labels, specialtasks, etc. 1163 1164 @param serialized: Representation of an object and its dependencies, as 1165 returned by serialize. 1166 1167 @raises ValueError: if serialized contains related objects, i.e. not 1168 only local fields. 1169 """ 1170 local, related = ( 1171 self._split_local_from_foreign_values(serialized)) 1172 if related: 1173 raise ValueError('Serialized must not contain foreign ' 1174 'objects: %s' % related) 1175 1176 self._deserialize_local(local) 1177 1178 1179 def custom_deserialize_relation(self, link, data): 1180 """Allows overriding the deserialization behaviour by subclasses.""" 1181 raise NotImplementedError( 1182 'custom_deserialize_relation must be implemented by subclass %s ' 1183 'for relation %s' % (type(self), link)) 1184 1185 1186 def _deserialize_relation(self, link, data): 1187 """Deserializes related objects and sets references on this object. 1188 1189 Relations that point to a list of objects are handled automatically. 1190 For many-to-one or one-to-one relations custom_deserialize_relation 1191 must be overridden by the subclass. 1192 1193 Related objects are deserialized using their deserialize() method. 1194 Thereby they and their dependencies are created if they don't exist 1195 and saved to the database. 1196 1197 @param link: Name of the relation. 1198 @param data: Serialized representation of the related object(s). 1199 This means a list of dictionaries for to-many relations, 1200 just a dictionary for to-one relations. 1201 """ 1202 field = getattr(self, link) 1203 1204 if field and hasattr(field, 'all'): 1205 self._deserialize_2m_relation(link, data, field.model) 1206 else: 1207 self.custom_deserialize_relation(link, data) 1208 1209 1210 def _deserialize_2m_relation(self, link, data, related_class): 1211 """Deserialize related objects for one to-many relationship. 1212 1213 @param link: Name of the relation. 1214 @param data: Serialized representation of the related objects. 1215 This is a list with of dictionaries. 1216 @param related_class: A class representing a django model, with which 1217 this class has a one-to-many relationship. 1218 """ 1219 relation_set = getattr(self, link) 1220 if related_class == self.get_attribute_model(): 1221 # When deserializing a model together with 1222 # its attributes, clear all the exising attributes to ensure 1223 # db consistency. Note 'update' won't be sufficient, as we also 1224 # want to remove any attributes that no longer exist in |data|. 1225 # 1226 # core_filters is a dictionary of filters, defines how 1227 # RelatedMangager would query for the 1-to-many relationship. E.g. 1228 # Host.objects.get( 1229 # id=20).hostattribute_set.core_filters = {host_id:20} 1230 # We use it to delete objects related to the current object. 1231 related_class.objects.filter(**relation_set.core_filters).delete() 1232 for serialized in data: 1233 relation_set.add(related_class.deserialize(serialized)) 1234 1235 1236 @classmethod 1237 def get_attribute_model(cls): 1238 """Return the attribute model. 1239 1240 Subclass with attribute-like model should override this to 1241 return the attribute model class. This method will be 1242 called by _deserialize_2m_relation to determine whether 1243 to clear the one-to-many relations first on deserialization of object. 1244 """ 1245 return None 1246 1247 1248class ModelWithInvalid(ModelExtensions): 1249 """ 1250 Overrides model methods save() and delete() to support invalidation in 1251 place of actual deletion. Subclasses must have a boolean "invalid" 1252 field. 1253 """ 1254 1255 def save(self, *args, **kwargs): 1256 first_time = (self.id is None) 1257 if first_time: 1258 # see if this object was previously added and invalidated 1259 my_name = getattr(self, self.name_field) 1260 filters = {self.name_field : my_name, 'invalid' : True} 1261 try: 1262 old_object = self.__class__.objects.get(**filters) 1263 self.resurrect_object(old_object) 1264 except self.DoesNotExist: 1265 # no existing object 1266 pass 1267 1268 super(ModelWithInvalid, self).save(*args, **kwargs) 1269 1270 1271 def resurrect_object(self, old_object): 1272 """ 1273 Called when self is about to be saved for the first time and is actually 1274 "undeleting" a previously deleted object. Can be overridden by 1275 subclasses to copy data as desired from the deleted entry (but this 1276 superclass implementation must normally be called). 1277 """ 1278 self.id = old_object.id 1279 1280 1281 def clean_object(self): 1282 """ 1283 This method is called when an object is marked invalid. 1284 Subclasses should override this to clean up relationships that 1285 should no longer exist if the object were deleted. 1286 """ 1287 pass 1288 1289 1290 def delete(self): 1291 self.invalid = self.invalid 1292 assert not self.invalid 1293 self.invalid = True 1294 self.save() 1295 self.clean_object() 1296 1297 1298 @classmethod 1299 def get_valid_manager(cls): 1300 return cls.valid_objects 1301 1302 1303 class Manipulator(object): 1304 """ 1305 Force default manipulators to look only at valid objects - 1306 otherwise they will match against invalid objects when checking 1307 uniqueness. 1308 """ 1309 @classmethod 1310 def _prepare(cls, model): 1311 super(ModelWithInvalid.Manipulator, cls)._prepare(model) 1312 cls.manager = model.valid_objects 1313 1314 1315class ModelWithAttributes(object): 1316 """ 1317 Mixin class for models that have an attribute model associated with them. 1318 The attribute model is assumed to have its value field named "value". 1319 """ 1320 1321 def _get_attribute_model_and_args(self, attribute): 1322 """ 1323 Subclasses should override this to return a tuple (attribute_model, 1324 keyword_args), where attribute_model is a model class and keyword_args 1325 is a dict of args to pass to attribute_model.objects.get() to get an 1326 instance of the given attribute on this object. 1327 """ 1328 raise NotImplementedError 1329 1330 1331 def set_attribute(self, attribute, value): 1332 attribute_model, get_args = self._get_attribute_model_and_args( 1333 attribute) 1334 attribute_object, _ = attribute_model.objects.get_or_create(**get_args) 1335 attribute_object.value = value 1336 attribute_object.save() 1337 1338 1339 def delete_attribute(self, attribute): 1340 attribute_model, get_args = self._get_attribute_model_and_args( 1341 attribute) 1342 try: 1343 attribute_model.objects.get(**get_args).delete() 1344 except attribute_model.DoesNotExist: 1345 pass 1346 1347 1348 def set_or_delete_attribute(self, attribute, value): 1349 if value is None: 1350 self.delete_attribute(attribute) 1351 else: 1352 self.set_attribute(attribute, value) 1353 1354 1355class ModelWithHashManager(dbmodels.Manager): 1356 """Manager for use with the ModelWithHash abstract model class""" 1357 1358 def create(self, **kwargs): 1359 raise Exception('ModelWithHash manager should use get_or_create() ' 1360 'instead of create()') 1361 1362 1363 def get_or_create(self, **kwargs): 1364 kwargs['the_hash'] = self.model._compute_hash(**kwargs) 1365 return super(ModelWithHashManager, self).get_or_create(**kwargs) 1366 1367 1368class ModelWithHash(dbmodels.Model): 1369 """Superclass with methods for dealing with a hash column""" 1370 1371 the_hash = dbmodels.CharField(max_length=40, unique=True) 1372 1373 objects = ModelWithHashManager() 1374 1375 class Meta: 1376 abstract = True 1377 1378 1379 @classmethod 1380 def _compute_hash(cls, **kwargs): 1381 raise NotImplementedError('Subclasses must override _compute_hash()') 1382 1383 1384 def save(self, force_insert=False, **kwargs): 1385 """Prevents saving the model in most cases 1386 1387 We want these models to be immutable, so the generic save() operation 1388 will not work. These models should be instantiated through their the 1389 model.objects.get_or_create() method instead. 1390 1391 The exception is that save(force_insert=True) will be allowed, since 1392 that creates a new row. However, the preferred way to make instances of 1393 these models is through the get_or_create() method. 1394 """ 1395 if not force_insert: 1396 # Allow a forced insert to happen; if it's a duplicate, the unique 1397 # constraint will catch it later anyways 1398 raise Exception('ModelWithHash is immutable') 1399 super(ModelWithHash, self).save(force_insert=force_insert, **kwargs) 1400