1
1
from base64 import encodestring
2
2
from datetime import datetime
3
+ import logging
3
4
import mimetypes
4
5
import re
5
6
import urllib
37
38
38
39
# regex used to find links in an article
LINK_RE = re.compile(r'<a.*?href="(.*?)".*?>(.*?)</a>', re.I | re.M)
# regex used to pull the title out of a fetched page; tolerates attributes
# on the <title> tag
TITLE_RE = re.compile(r'<title.*?>(.*?)</title>', re.I | re.M)
# regex matching any character that is NOT allowed in a tag slug; the raw
# string avoids the invalid escape sequences ('\-', '\+', '\:', '\.') that
# a normal string literal would carry
TAG_RE = re.compile(r'[^a-z0-9\-_\+\:\.]?', re.I)

# NOTE(review): getLogger(__file__) names the logger after the file path;
# getLogger(__name__) is the usual convention -- confirm existing logging
# configuration does not rely on the current name before changing it.
log = logging.getLogger(__file__)
43
46
def get_name(user):
    """
    Returns a display name for ``user``: the full name when one has been
    entered, falling back to the username otherwise.

    The resolved name is cached for a day (86400 seconds) under a key
    derived from the user's id, so repeated lookups are cheap.
    """

    key = 'username_for_%s' % user.id

    log.debug('Looking for "%s" in cache (%s)' % (key, user))
    name = cache.get(key)
    if not name:
        log.debug('Name not found')

        # call get_full_name() once and test the stripped value directly,
        # so a whitespace-only name still falls back to the username
        full_name = user.get_full_name()
        if full_name.strip():
            log.debug('Using full name')
            name = full_name
        else:
            log.debug('Using username')
            name = user.username

        log.debug('Caching %s as "%s" for a while' % (key, name))
        cache.set(key, name, 86400)

    return name
@@ -70,11 +82,15 @@ def clean_tag(name):
70
82
71
83
name = name .replace (' ' , '-' ).encode ('ascii' , 'ignore' )
72
84
name = TAG_RE .sub ('' , name )
73
- return name .lower ().strip ()
85
+ clean = name .lower ().strip ()
86
+
87
+ log .debug ('Cleaned tag "%s" to "%s"' % (name , clean ))
88
+ return clean
74
89
75
90
def save(self, *args, **kwargs):
    """Ensures the tag has a URL-safe slug before persisting it."""

    log.debug('Ensuring that tag "%s" has a slug' % (self,))

    # derive the slug from the cleaned tag name, then save as usual
    slug = Tag.clean_tag(self.name)
    self.slug = slug
    super(Tag, self).save(*args, **kwargs)
80
96
@@ -96,6 +112,7 @@ class Meta:
96
112
ordering = ('name' ,)
97
113
98
114
class ArticleStatusManager (models .Manager ):
115
+
99
116
def default (self ):
100
117
default = self .all ()[:1 ]
101
118
@@ -122,10 +139,11 @@ def __unicode__(self):
122
139
return self .name
123
140
124
141
class ArticleManager (models .Manager ):
142
+
125
143
def active (self ):
126
144
"""
127
- Retrieves all active articles which have been published and have not yet
128
- expired.
145
+ Retrieves all active articles which have been published and have not
146
+ yet expired.
129
147
"""
130
148
now = datetime .now ()
131
149
return self .get_query_set ().filter (
@@ -185,9 +203,7 @@ class Article(models.Model):
185
203
objects = ArticleManager ()
186
204
187
205
def __init__ (self , * args , ** kwargs ):
188
- """
189
- Make sure that we have some rendered content to use.
190
- """
206
+ """Makes sure that we have some rendered content to use"""
191
207
192
208
super (Article , self ).__init__ (* args , ** kwargs )
193
209
@@ -208,9 +224,8 @@ def __unicode__(self):
208
224
return self .title
209
225
210
226
def save (self , * args , ** kwargs ):
211
- """
212
- Renders the article using the appropriate markup language.
213
- """
227
+ """Renders the article using the appropriate markup language."""
228
+
214
229
using = kwargs .get ('using' , DEFAULT_DB )
215
230
216
231
self .do_render_markup ()
def _get_article_links(self):
    """
    Locates all hyperlinks in this article's rendered content and pairs
    each URL with a title.

    Titles are served from the cache when possible.  On a cache miss the
    link's own text is used as a fallback; when LOOKUP_LINK_TITLE is
    enabled, the target page is fetched and the contents of its <title>
    tag (if any) are used instead.  Whatever title is determined is then
    cached for a week (604800 seconds).  Duplicate URLs are reported only
    once, in the order they first appear.

    Returns a tuple of (url, title) pairs.
    """

    links = []
    # URLs already collected; a set lookup avoids re-scanning the list
    # of links once per link found in the article
    seen = set()

    # find all links in the article
    log.debug('Locating links in article: %s' % (self,))
    for link in LINK_RE.finditer(self.rendered_content):
        url = link.group(1)
        log.debug('Do we have a title for "%s"?' % (url,))
        key = 'href_title_' + encodestring(url).strip()

        # look in the cache for the link target's title
        title = cache.get(key)
        if title is None:
            log.debug('Nope... Getting it and caching it.')

            # fall back to the text between the <a> and </a> tags
            title = link.group(2)

            if LOOKUP_LINK_TITLE:
                try:
                    log.debug('Looking up title for URL: %s' % (url,))

                    # open the URL; close it even if read() blows up
                    c = urllib.urlopen(url)
                    try:
                        html = c.read()
                    finally:
                        c.close()

                    # try to determine the title of the target
                    title_m = TITLE_RE.search(html)
                    if title_m:
                        title = title_m.group(1)
                        log.debug('Found title: %s' % (title,))
                except Exception:
                    # if anything goes wrong (ie IOError), use the link's
                    # text; narrow except so Ctrl-C etc. still propagate
                    log.warning('Failed to retrieve the title for "%s"; using link text "%s"' % (url, title))

            # cache the page title for a week
            log.debug('Using "%s" as title for "%s"' % (title, url))
            cache.set(key, title, 604800)

        # add it to the list of links and titles, skipping duplicates
        if url not in seen:
            seen.add(url)
            links.append((url, title))

    return tuple(links)
420
432
links = property (_get_article_links )
421
433
422
434
def _get_word_count (self ):
0 commit comments