importexport.py 3.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990
  1. import csv
  2. import copy
  3. from django import forms
  4. from django.apps import apps
  5. from django.contrib.contenttypes.models import ContentType
  6. from django.db import transaction
  7. from wagtail.core.models import Page
  8. from wagtailimportexport.forms import ImportFromFileForm
  9. from wagtailimportexport.importing import update_page_references
  10. from coderedcms.forms import get_page_model_choices
  11. class ImportPagesFromCSVFileForm(ImportFromFileForm):
  12. page_type = forms.ChoiceField(choices=get_page_model_choices)
  13. @transaction.atomic()
  14. def import_pages(import_data, parent_page):
  15. """
  16. Overwrite of the wagtailimportexport `import_page` function to handle generic csvs.
  17. The standard `import_pages` assumes that your pages will have a pk from the exported
  18. json files. It does not facilitate the idea that the pages you import will be
  19. new pages.
  20. """
  21. pages_by_original_id = {}
  22. # First create the base Page records; these contain no foreign keys, so this allows us to
  23. # build a complete mapping from old IDs to new IDs before we go on to importing the
  24. # specific page models, which may require us to rewrite page IDs within foreign keys / rich
  25. # text / streamfields.
  26. page_content_type = ContentType.objects.get_for_model(Page)
  27. for page_record in import_data['pages']:
  28. # build a base Page instance from the exported content
  29. # (so that we pick up its title and other core attributes)
  30. page = Page.from_serializable_data(page_record['content'])
  31. # clear id and treebeard-related fields so that
  32. # they get reassigned when we save via add_child
  33. page.id = None
  34. page.path = None
  35. page.depth = None
  36. page.numchild = 0
  37. page.url_path = None
  38. page.content_type = page_content_type
  39. parent_page.add_child(instance=page)
  40. # Custom Code to add the new pk back into the original page record.
  41. page_record['content']['pk'] = page.pk
  42. pages_by_original_id[page.id] = page
  43. for page_record in import_data['pages']:
  44. # Get the page model of the source page by app_label and model name
  45. # The content type ID of the source page is not in general the same
  46. # between the source and destination sites but the page model needs
  47. # to exist on both.
  48. # Raises LookupError exception if there is no matching model
  49. model = apps.get_model(page_record['app_label'], page_record['model'])
  50. specific_page = model.from_serializable_data(
  51. page_record['content'],
  52. check_fks=False,
  53. strict_fks=False
  54. )
  55. base_page = pages_by_original_id[specific_page.id]
  56. specific_page.page_ptr = base_page
  57. specific_page.__dict__.update(base_page.__dict__)
  58. specific_page.content_type = ContentType.objects.get_for_model(model)
  59. update_page_references(specific_page, pages_by_original_id)
  60. specific_page.save()
  61. return len(import_data['pages'])
  62. def convert_csv_to_json(csv_file, page_type):
  63. pages_json = {"pages": []}
  64. default_page_data = {"app_label": "website", "content": {"pk": None}, "model": page_type}
  65. pages_csv_dict = csv.DictReader(csv_file)
  66. for row in pages_csv_dict:
  67. page_dict = copy.deepcopy(default_page_data)
  68. page_dict['content'].update(row)
  69. pages_json['pages'].append(page_dict)
  70. return pages_json