My favorites | Sign in
Project Logo
             
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
import wsgiref.handlers, os, sys, re, logging, urllib, md5
from google.appengine.ext.webapp import template
from google.appengine.api import users, urlfetch, memcache
from google.appengine.ext import webapp, db

# Counter names reserved for the application's own bookkeeping. add_count()
# and get_count() create these with type=True and every other name with
# type=False.
inner_counter = ['visit_url_record','url_record','visit_host_record','host_record']

# Google Analytics tracking snippet. MainPage.get() writes it to the response
# right after the landing page and after every proxied HTML page.
ga = """
<script type="text/javascript">
var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
</script>
<script type="text/javascript">
try {
var pageTracker = _gat._getTracker("UA-95317-5");
pageTracker._trackPageview();
} catch(err) {}</script>
"""

class UrlRecord(db.Model):
    """Datastore entity with per-URL statistics for a proxied HTML page."""

    # Upstream base address the page was fetched from.
    host = db.StringProperty()
    # Full upstream URL; MainPage looks records up by this field.
    url = db.StringProperty()
    # Text taken from the page's <title> element (empty when none matched).
    title = db.TextProperty()
    # Incremented each time the page is served through the proxy.
    count = db.IntegerProperty()
    # Set when the entity is first stored / on every store, respectively.
    created = db.DateTimeProperty(auto_now_add=True)
    updated = db.DateTimeProperty(auto_now=True)

class VisitRecord(db.Model):
    """Datastore entity describing one visitor and the page they last viewed.

    MainPage identifies a visitor by the (address, user_agent) pair and
    overwrites ``url`` on every proxied HTML page view.
    """

    # Upstream URL most recently served to this visitor.
    url = db.StringProperty()
    # Set when the entity is first stored / on every store, respectively.
    created = db.DateTimeProperty(auto_now_add=True)
    updated = db.DateTimeProperty(auto_now=True)
    # User-Agent header of the visiting client.
    user_agent = db.StringProperty()
    # Remote address of the visiting client.
    address = db.StringProperty()

class Counter(db.Model):
    """Datastore entity holding one named integer counter."""

    # Set when the entity is first stored / on every store, respectively.
    created = db.DateTimeProperty(auto_now_add=True)
    updated = db.DateTimeProperty(auto_now=True)
    # True for the reserved names listed in inner_counter, False otherwise.
    type = db.BooleanProperty()
    # Name used by add_count() / get_count() to find the counter.
    name = db.StringProperty()
    # Current total.
    value = db.IntegerProperty()

class LocalUser(db.Model):
    """Datastore entity remembering a signed-in user seen by MainPage."""

    # The account returned by users.get_current_user().
    user = db.UserProperty()
    # Set when the entity is first stored / on every store, respectively.
    created = db.DateTimeProperty(auto_now_add=True)
    updated = db.DateTimeProperty(auto_now=True)


def add_count(name, delta):
    """Add ``delta`` to the counter called ``name``, creating it on first use.

    A counter that does not exist yet starts at ``delta``; its ``type`` flag
    is True when ``name`` is one of the reserved names in ``inner_counter``
    and False otherwise. The entity is stored in either case.

    NOTE(review): the read-modify-write is not wrapped in a transaction, so
    concurrent requests can lose increments.
    """
    existing = Counter.all().filter('name =', name).get()
    if existing is not None:
        existing.value += delta
        existing.put()
        return
    # First sighting of this name: the initial value is the delta itself.
    Counter(name=name, value=delta, type=(name in inner_counter)).put()

def get_count(name):
    """Return the value of the counter called ``name``.

    A missing counter is created with value 0 (``type`` is True for the
    reserved names in ``inner_counter``, False otherwise), stored, and 0 is
    returned.
    """
    found = Counter.all().filter('name =', name).get()
    if found is not None:
        return found.value
    # NOTE(review): the original indentation was lost; this assumes the
    # put() belongs to the creation branch rather than running on every read.
    fresh = Counter(name=name, value=0, type=(name in inner_counter))
    fresh.put()
    return fresh.value

class MainPage(webapp.RequestHandler):
    """Landing page and *.blogspot.com relay.

    The first path segment of a request selects the blogspot sub-domain and
    the remainder of the path is forwarded unchanged, so ``/foo/2009/x.html``
    is fetched from ``http://foo.blogspot.com/2009/x.html``.
    """

    def get(self):
        """Serve the landing page, or fetch and relay the requested blog page.

        * A request for the bare site root renders ``index.html``.
        * Upstream responses with a status other than 200 are relayed as-is.
        * Image responses are relayed and stored in memcache.
        * HTML responses have links to the upstream host rewritten to point
          back at this proxy, get the analytics snippet appended, and update
          the visit statistics.
        * Any other content type, or a failed fetch, renders the landing
          page with the upstream URL as the error message.
        """
        # Best-effort header dump for debugging; never fail the request on it.
        try:
            for k, v in self.request.headers.items():
                logging.info('%s = %s ' % (k, v))
        except Exception:
            logging.exception('could not log request headers')

        uri = self.request.uri
        host = '%s://%s/' % (self.request.scheme, self.request.host)

        user = users.get_current_user()
        if user and LocalUser.all().filter('user =', user).get() is None:
            LocalUser(user=user).put()
            add_count('user_counter', 1)

        # Unquote only the path. partition() keeps the whole query string,
        # whereas joining split('?')[0] and [-1] dropped the middle of any
        # URI that contained more than one '?'.
        base, sep, query = uri.partition('?')
        uri = urllib.unquote(base) + sep + query

        url_list = uri.split('/')
        # scheme://this-host/<sub-domain>/ : the proxy-side prefix that
        # replaces the upstream host inside relayed HTML.
        local_host = '/'.join(url_list[0:4]) + '/'
        path = os.path.join(os.path.dirname(__file__), 'index.html')

        if uri == host:
            self.response.out.write(
                template.render(path, self.create_template_values(host)))
            self.response.out.write(ga)
            return

        # NOTE(review): url_list[3] is taken from the request unchecked, so a
        # segment containing characters such as '#' or an encoded '?' can
        # point the fetch at a host other than *.blogspot.com. Consider
        # validating it against the allowed sub-domain alphabet.
        remote_host = 'http://' + url_list[3] + '.blogspot.com/'
        url = remote_host + '/'.join(url_list[4:])
        url_text = unicode(url, 'utf-8')
        logging.debug(url_text)

        result = None
        cache_key = None
        try:
            # Hash the raw byte string. Feeding md5 a unicode object makes it
            # encode with the ASCII codec, which raised for non-ASCII URLs
            # and silently disabled caching for them. Keys for ASCII URLs
            # are unchanged.
            cache_key = md5.new(url).hexdigest()
            result = memcache.get(cache_key)
        except Exception:
            logging.exception('memcache lookup failed for %s', url)

        if result is None:
            try:
                # NOTE(review): every incoming request header (cookies
                # included) is forwarded to the upstream host.
                result = urlfetch.fetch(url, headers=self.request.headers)
            except Exception:
                logging.exception('fetch failed for %s', url)
                self._write_error(path, host, url)
                return

        self.response.headers = result.headers
        if result.status_code != 200:
            self.response.out.write(result.content)
            return

        # A missing Content-Type header is treated as "neither image nor
        # HTML" instead of raising KeyError.
        content_type = result.headers.get('Content-Type', '') or ''

        if 'image' in content_type:
            self.response.out.write(result.content)
            if cache_key is not None:
                try:
                    memcache.add(cache_key, result)
                except Exception:
                    # Caching is an optimisation; e.g. an oversize value must
                    # not turn an already-served image into an error.
                    logging.exception('memcache add failed for %s', url)
            return

        if 'html' not in content_type:
            self._write_error(path, host, url)
            return

        self.response.out.write(
            self.replace(result.content, {remote_host: local_host}))
        self.response.out.write(ga)
        self._record_visit(url, url_text, remote_host, result.content)

    def _write_error(self, path, host, url):
        """Render the landing page with ``url`` shown as the error message."""
        template_values = self.create_template_values(host)
        template_values['error_msg'] = '[%s]' % url
        self.response.out.write(template.render(path, template_values))

    def _record_visit(self, url, url_text, remote_host, html):
        """Update URL and visitor statistics for one relayed HTML page.

        Failures are logged and swallowed: statistics must never break a
        response that has already been written.
        """
        try:
            match = re.search(u'<title>.*</title>', html)
            title = ''
            if match:
                title = unicode(match.group(0), 'utf-8').replace('<title>', '').replace('</title>', '')

            url_record = UrlRecord.all().filter('url =', url_text).get()
            if url_record is None:
                url_record = UrlRecord(host=remote_host, url=url_text,
                                       title=db.Text(title), count=0)
                add_count('url_record', 1)
            url_record.count += 1
            url_record.put()

            add_count('visit_url_record', 1)
            # Per-URL counter, skipped for a blog's front page.
            if url != remote_host:
                add_count(url_text, 1)

            user_agent = unicode(self.request.user_agent, 'utf-8')
            visit_record = VisitRecord.all().filter(
                'address', self.request.remote_addr).filter(
                'user_agent', user_agent).get()
            if visit_record is None:
                visit_record = VisitRecord(address=self.request.remote_addr,
                                           user_agent=self.request.user_agent)
            visit_record.url = url_text
            visit_record.put()
        except Exception:
            logging.exception('could not record statistics for %s', url)

    def post(self):
        """Redirect to the proxy path for the submitted ``stuff_url`` field.

        An empty field redirects to the site root.
        """
        # Strip leading slashes: '/%s' with a value starting with '/' yields
        # '//host', a protocol-relative URL that redirects off-site.
        stuff_url = self.request.get('stuff_url').lstrip('/')
        self.redirect('/%s' % stuff_url)

    def create_template_values(self, host):
        """Build the context dictionary used to render ``index.html``.

        ``host`` is passed through under the ``host`` key; the login and
        logout URLs return to the current request URI.
        """
        # NOTE(review): 'top_host' and 'top_url' run the identical query (the
        # ten highest-valued counters with type False) - confirm whether
        # 'top_host' was meant to select something else.
        return {
            'top_host': Counter.all().filter('type =', False).order('-value').fetch(10),
            'top_url': Counter.all().filter('type =', False).order('-value').fetch(10),
            'login_url': users.create_login_url(self.request.uri),
            'logout_url': users.create_logout_url(self.request.uri),
            'host': host,
        }

    def replace(self, content, replace_str_dict=None):
        """Return ``content`` with every key of ``replace_str_dict`` replaced by its value.

        With no mapping (or an empty one) ``content`` is returned unchanged.
        """
        for old, new in (replace_str_dict or {}).items():
            content = content.replace(old, new)
        return content

def main():
    """Build the WSGI application and run it under the CGI handler."""
    # Every path is routed to MainPage.
    routes = [('/.*', MainPage)]
    app = webapp.WSGIApplication(routes, debug=False)
    wsgiref.handlers.CGIHandler().run(app)


if __name__ == "__main__":
    main()
Show details Hide details

Change log

r27 by ibeyond on May 27, 2009   Diff
[No log message]
Go to: 
Project members, sign in to write a code review

Older revisions

r26 by ibeyond on Jul 24, 2008   Diff
取消Wikipedia的代理。
取消浏览全部blog的链接。
r25 by iBeyond on Jun 29, 2008   Diff
增加Robots.txt文件,阻止维基百科的搜索引擎检索。
r24 by iBeyond on May 26, 2008   Diff
修正计数器Bug
All revisions of this file

File info

Size: 7828 bytes, 186 lines
Hosted by Google Code