forked from Arachnid/bloggart
/
models.py
176 lines (150 loc) · 5.57 KB
/
models.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
from lib import aetycoon
import hashlib
import re
from google.appengine.ext import db
from google.appengine.ext import deferred
from google.appengine.api import urlfetch
import config
import generators
import markup
import static
import utils
from bs4 import BeautifulSoup
import logging
from webmentiontools.send import WebmentionSend
import urlparse
from django.utils import simplejson
# Use the configured markup only when a renderer is registered for it;
# otherwise fall back to plain HTML.
DEFAULT_MARKUP = (
    config.default_markup
    if config.default_markup in markup.MARKUP_MAP
    else 'html'
)
def is_absolute(url):
    """Returns True when url carries a network location (host) component."""
    parsed = urlparse.urlparse(url)
    return True if parsed.netloc else False
class BlogPost(db.Model):
    """Datastore model for a blog post and its publishing workflow.

    Besides the stored fields, the model knows how to publish itself
    (allocate a path and regenerate dependent static resources), remove
    itself, and send webmentions for the links in its body.
    """

    # The URL path to the blog post. Posts have a path iff they are published.
    path = db.StringProperty()
    title = db.StringProperty(required=True, indexed=False)
    body_markup = db.StringProperty(choices=set(markup.MARKUP_MAP),
                                    default=DEFAULT_MARKUP)
    body = db.TextProperty(required=True)
    tags = aetycoon.SetProperty(basestring, indexed=False)
    published = db.DateTimeProperty()
    updated = db.DateTimeProperty(auto_now=False)
    # Maps generator name -> (resource set, etag) recorded by get_deps().
    deps = aetycoon.PickleProperty()
    # NOTE(review): the fields below look like metadata of an originating
    # e-mail message -- confirm against the code that populates them.
    author = db.StringProperty()
    recipients = db.StringListProperty()
    cc = db.StringListProperty()
    bcc = db.StringListProperty()
    date_sent = db.DateTimeProperty()
    # JSON-encoded text; decoded by the custom_headers property.
    headers = db.StringProperty()

    @aetycoon.TransformProperty(tags)
    def normalized_tags(tags):
        """Returns the de-duplicated, lower-cased and slugified tags."""
        return list(set(utils.slugify(x.lower()) for x in tags))

    @property
    def tag_pairs(self):
        """Returns a list of (tag, slugified lower-cased tag) tuples."""
        return [(x, utils.slugify(x.lower())) for x in self.tags]

    @property
    def rendered(self):
        """Returns the rendered body."""
        return markup.render_body(self)

    @property
    def summary(self):
        """Returns a summary of the blog post."""
        return markup.render_summary(self)

    @property
    def hash(self):
        """Returns a SHA-1 hex digest over the title, body and publish date."""
        val = (self.title, self.body, self.published)
        return hashlib.sha1(str(val)).hexdigest()

    @property
    def summary_hash(self):
        """Returns a SHA-1 hex digest over title, summary, tags and date."""
        val = (self.title, self.summary, self.tags, self.published)
        return hashlib.sha1(str(val)).hexdigest()

    @property
    def custom_headers(self):
        """Returns the stored headers without placeholder entries, or None.

        The ``headers`` field holds a JSON document. Entries containing
        'placeholder' are dropped. None is returned when no headers are
        stored or when nothing remains after filtering.
        """
        if not self.headers:
            # Nothing stored: decoding None or '' would raise.
            return None
        all_headers = simplejson.loads(self.headers)
        simplified_headers = [x for x in all_headers if 'placeholder' not in x]
        return simplified_headers or None

    def publish(self):
        """Publishes the post and regenerates the resources depending on it.

        On first publication a free path is allocated, the entity is saved,
        a full regeneration is forced and a deferred task is queued to send
        webmentions. The entity is saved again once the dependency
        bookkeeping has been updated.
        """
        regenerate = False
        if not self.path:
            num = 0
            content = None
            # Try successive candidate paths until static.add() accepts one.
            while not content:
                path = utils.format_post_path(self, num)
                content = static.add(path, '', config.html_mime_type)
                num += 1
            self.path = path
            self.put()
            # Force regenerate on new publish. Also helps with generation of
            # chronologically previous and next page.
            regenerate = True
            # After publishing for the first time, try to ping sites you
            # mention.
            deferred.defer(self.mention)
        if not self.deps:
            self.deps = {}
        for generator_class, deps in self.get_deps(regenerate=regenerate):
            for dep in deps:
                if generator_class.can_defer:
                    deferred.defer(generator_class.generate_resource, None, dep)
                else:
                    generator_class.generate_resource(self, dep)
        self.put()

    def mention(self):
        """Sends a webmention to every absolute link in the post body.

        Does nothing for unpublished posts or for posts not written in
        HTML. A failure while notifying one link is logged and does not
        prevent the remaining links from being notified.
        """
        if not self.path:
            return
        # TODO: currently only works if the writing is done in HTML; should
        # instead wait until the body is rendered.
        if self.body_markup != 'html':
            return
        # TODO: don't hardcode scheme, what about https?
        full_path = 'http://%s%s' % (config.host, self.path)
        soup = BeautifulSoup(self.body)
        any_match = re.compile('.*')
        for anchor in soup.findAll('a', attrs={'href': any_match}):
            href = anchor.get('href')
            if not is_absolute(href):
                continue
            try:
                accepted = WebmentionSend(full_path, href).send()
            except Exception:
                # publish() runs this method as a deferred task. Letting the
                # error escape would abort the loop and fail the task, and a
                # retried task would ping the already-notified links again.
                logging.exception('Mention of %s failed.', href)
                continue
            if accepted:
                logging.info('Mention of %s was accepted.', href)
            else:
                logging.info('Mention of %s was not accepted.', href)

    def remove(self):
        """Deletes a saved post and regenerates the resources it affected.

        Unsaved posts are ignored. The entity itself is deleted right after
        the non-deferred 'PostContentGenerator' has handled a resource with
        action='delete'.
        """
        if not self.is_saved():
            return
        if not self.deps:
            self.deps = {}
        # It is important that the get_deps() return the post dependency
        # before the list dependencies as the BlogPost entity gets deleted
        # while calling PostContentGenerator.
        for generator_class, deps in self.get_deps(regenerate=True):
            for dep in deps:
                if generator_class.can_defer:
                    deferred.defer(generator_class.generate_resource, None, dep)
                elif generator_class.name() == 'PostContentGenerator':
                    generator_class.generate_resource(self, dep, action='delete')
                    self.delete()
                else:
                    generator_class.generate_resource(self, dep)

    def get_deps(self, regenerate=False):
        """Yields (generator_class, resources_to_regenerate) pairs.

        For each class in generators.generator_list the current resource
        list and etag are compared with the values recorded in ``deps``,
        and ``deps`` is updated with the new values before yielding.

        Args:
          regenerate: When true, every old and new resource is yielded
            regardless of whether the etag changed.
        """
        if not self.deps:
            # Callers normally initialise this; guard so the generator is
            # also safe when used on its own.
            self.deps = {}
        for generator_class in generators.generator_list:
            new_deps = set(generator_class.get_resource_list(self))
            new_etag = generator_class.get_etag(self)
            name = generator_class.name()
            old_deps, old_etag = self.deps.get(name, (set(), None))
            if new_etag != old_etag or regenerate:
                # If the etag has changed, regenerate everything
                to_regenerate = new_deps | old_deps
            else:
                # Otherwise just regenerate the changes
                to_regenerate = new_deps ^ old_deps
            self.deps[name] = (new_deps, new_etag)
            yield generator_class, to_regenerate
class VersionInfo(db.Model):
    """Datastore model holding a version as three required integer parts."""

    bloggart_major = db.IntegerProperty(required=True)
    bloggart_minor = db.IntegerProperty(required=True)
    bloggart_rev = db.IntegerProperty(required=True)

    @property
    def bloggart_version(self):
        """Returns the version as a (major, minor, rev) tuple."""
        major = self.bloggart_major
        minor = self.bloggart_minor
        rev = self.bloggart_rev
        return major, minor, rev