fabianvf · April 13, 2015 15:28 · brianjgeiger · Apr 13, 2015 · walkerh · Apr 13, 2015
diff --git a/storage.py b/storage.py
 import os
 import json

 from scrapi.processing.base import BaseProcessor


 class StorageProcessor(BaseProcessor):
    """Processor that archives documents as JSON files on the local disk.

    Files are written beneath the relative ``archive/`` directory (resolved
    against the process's current working directory), one sub-directory per
    ``<source>/<docID>`` pair.
    """
    NAME = 'storage'

    def process_raw(self, raw):
        """Write the raw document's attributes to ``archive/<source>/<docID>/raw.<filetype>``.

        The file content is always a JSON dump of ``raw.attributes``; only the
        file extension is taken from ``raw['filetype']``.

        :param raw: document supporting item access for ``'source'``,
            ``'docID'`` and ``'filetype'`` and exposing ``.attributes``.
        """
        filename = 'archive/{}/{}/raw.{}'.format(raw['source'], raw['docID'], raw['filetype'])
        self._write_json(filename, raw.attributes)

    def process_normalized(self, raw, normalized):
        """Write the normalized document to ``archive/<source>/<docID>/normalized.json``.

        :param raw: the raw document; only ``raw['source']`` and
            ``raw['docID']`` are read, to locate the output directory.
        :param normalized: document exposing ``.attributes``, which is what
            gets serialized.
        """
        # The path has exactly two placeholders; the stray third argument
        # (raw['filetype']) was unused and has been removed.
        filename = 'archive/{}/{}/normalized.json'.format(raw['source'], raw['docID'])
        self._write_json(filename, normalized.attributes)

    @staticmethod
    def _write_json(filename, attributes):
        """Serialize ``attributes`` as indented JSON into ``filename``.

        Missing parent directories are created first. An existing file at
        ``filename`` is overwritten.

        :raises OSError: if the parent directory cannot be created.
        """
        directory = os.path.dirname(filename)
        try:
            # Create first and inspect the failure afterwards: checking for
            # existence beforehand leaves a window in which another writer
            # can create the directory and make makedirs() fail.
            os.makedirs(directory)
        except OSError:
            # An already-present directory is fine; anything else is a real error.
            if not os.path.isdir(directory):
                raise

        with open(filename, 'w') as f:
            f.write(json.dumps(attributes, indent=4))
	import os
	import json

	from scrapi.processing.base import BaseProcessor


	class StorageProcessor(BaseProcessor):
	    """Processor that archives documents as JSON files on the local disk.

	    Files are written beneath the relative ``archive/`` directory (resolved
	    against the process's current working directory), one sub-directory per
	    ``<source>/<docID>`` pair.
	    """
	    NAME = 'storage'

	    def process_raw(self, raw):
	        """Write the raw document's attributes to ``archive/<source>/<docID>/raw.<filetype>``.

	        The file content is always a JSON dump of ``raw.attributes``; only the
	        file extension is taken from ``raw['filetype']``.

	        :param raw: document supporting item access for ``'source'``,
	            ``'docID'`` and ``'filetype'`` and exposing ``.attributes``.
	        """
	        filename = 'archive/{}/{}/raw.{}'.format(raw['source'], raw['docID'], raw['filetype'])
	        self._write_json(filename, raw.attributes)

	    def process_normalized(self, raw, normalized):
	        """Write the normalized document to ``archive/<source>/<docID>/normalized.json``.

	        :param raw: the raw document; only ``raw['source']`` and
	            ``raw['docID']`` are read, to locate the output directory.
	        :param normalized: document exposing ``.attributes``, which is what
	            gets serialized.
	        """
	        # The path has exactly two placeholders; the stray third argument
	        # (raw['filetype']) was unused and has been removed.
	        filename = 'archive/{}/{}/normalized.json'.format(raw['source'], raw['docID'])
	        self._write_json(filename, normalized.attributes)

	    @staticmethod
	    def _write_json(filename, attributes):
	        """Serialize ``attributes`` as indented JSON into ``filename``.

	        Missing parent directories are created first. An existing file at
	        ``filename`` is overwritten.

	        :raises OSError: if the parent directory cannot be created.
	        """
	        directory = os.path.dirname(filename)
	        try:
	            # Create first and inspect the failure afterwards: checking for
	            # existence beforehand leaves a window in which another writer
	            # can create the directory and make makedirs() fail.
	            os.makedirs(directory)
	        except OSError:
	            # An already-present directory is fine; anything else is a real error.
	            if not os.path.isdir(directory):
	                raise

	        with open(filename, 'w') as f:
	            f.write(json.dumps(attributes, indent=4))
No results found