My favorites | Sign in
Project Logo
                
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
import wsgiref.handlers, os, sys, re, logging, urllib, md5
from google.appengine.ext.webapp import template
from google.appengine.api import users, urlfetch, memcache
from google.appengine.ext import webapp, db

# Counter names that add_count()/get_count() create with Counter.type set to
# True; a counter created under any other name gets type False.
inner_counter = ['visit_url_record','url_record','visit_host_record','host_record']

# Google Analytics tracking snippet.  MainPage.get writes it to the response
# right after the rendered index page and after proxied HTML content.
ga = """
<script type="text/javascript">
var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
</script>
<script type="text/javascript">
try {
var pageTracker = _gat._getTracker("UA-95317-5");
pageTracker._trackPageview();
} catch(err) {}</script>
"""

class UrlRecord(db.Model):
    """Datastore entity describing a URL: its host, title and a count.

    ``created`` is stamped once when the entity is first stored and
    ``updated`` is refreshed on every put (``auto_now_add`` / ``auto_now``).
    """

    # Identification of the page.
    host = db.StringProperty()
    url = db.StringProperty()
    title = db.TextProperty()

    # Integer tally kept for this URL.
    count = db.IntegerProperty()

    # Automatic bookkeeping timestamps.
    created = db.DateTimeProperty(auto_now_add=True)
    updated = db.DateTimeProperty(auto_now=True)

class VisitRecord(db.Model):
    """Datastore entity holding a URL plus a user agent and an address.

    ``created`` is stamped once when the entity is first stored and
    ``updated`` is refreshed on every put (``auto_now_add`` / ``auto_now``).
    """

    url = db.StringProperty()

    # Automatic bookkeeping timestamps.
    created = db.DateTimeProperty(auto_now_add=True)
    updated = db.DateTimeProperty(auto_now=True)

    # Client details stored as plain strings.
    user_agent = db.StringProperty()
    address = db.StringProperty()

class Counter(db.Model):
    """Named integer counter stored in the datastore.

    add_count() and get_count() look counters up by ``name`` and create
    missing ones; they set ``type`` to True when the name is listed in
    ``inner_counter`` and to False otherwise.
    """

    # Automatic bookkeeping timestamps.
    created = db.DateTimeProperty(auto_now_add=True)
    updated = db.DateTimeProperty(auto_now=True)

    # True for names listed in inner_counter, False for every other name.
    type = db.BooleanProperty()
    # Lookup key used by add_count() / get_count().
    name = db.StringProperty()
    # Current tally.
    value = db.IntegerProperty()

class LocalUser(db.Model):
    """Datastore entity wrapping a user account with timestamps.

    ``created`` is stamped once when the entity is first stored and
    ``updated`` is refreshed on every put (``auto_now_add`` / ``auto_now``).
    """

    user = db.UserProperty()

    # Automatic bookkeeping timestamps.
    created = db.DateTimeProperty(auto_now_add=True)
    updated = db.DateTimeProperty(auto_now=True)


def add_count(name, delta):
    """Add ``delta`` to the counter called ``name`` and store the result.

    When no counter with that name exists yet, one is created whose value
    starts at ``delta`` and whose ``type`` flag tells whether the name is
    listed in ``inner_counter``.
    """
    # NOTE(review): the lookup, increment and put are separate datastore
    # operations, not a transaction -- concurrent calls may lose updates.
    entity = Counter.all().filter('name =', name).get()
    if entity is not None:
        entity.value += delta
    else:
        entity = Counter(name=name, value=delta, type=(name in inner_counter))
    entity.put()

def get_count(name):
    """Return the value of the counter called ``name``.

    A missing counter is created with value 0 (``type`` reflects whether the
    name is listed in ``inner_counter``), stored, and 0 is returned.
    """
    entity = Counter.all().filter('name =', name).get()
    if entity is not None:
        return entity.value

    # First request for this name: persist a zeroed counter.
    entity = Counter(name=name, value=0, type=(name in inner_counter))
    entity.put()
    return entity.value
# Module-level dict supplying the values used to render index.html.
template_values = {}
class MainPage(webapp.RequestHandler):
    """Request handler that relays ``<name>.blogspot.com`` pages.

    GET on the site root renders ``index.html``.  Any other GET treats the
    first path segment as a blogspot sub-domain, fetches the matching remote
    URL and relays the response.  POST redirects to the path given in the
    ``stuff_url`` form field.
    """

    def get(self):
        """Serve the index page or relay a blogspot URL.

        For a 200 response: images are written through unchanged and added
        to memcache; HTML is written with the remote host prefix replaced by
        the local one, followed by the analytics snippet; any other content
        type renders ``index.html`` with an ``error_msg``.  Non-200
        responses are written through unchanged.  A failed fetch renders
        ``index.html`` with an ``error_msg``.
        """
        # NOTE(review): every GET deletes up to 100 entities of each of these
        # kinds.  Kept because it is existing behaviour, but it looks like
        # leftover clean-up code -- confirm it is intended.
        db.delete(Counter.all().fetch(100))
        db.delete(UrlRecord.all().fetch(100))
        db.delete(VisitRecord.all().fetch(100))

        # Header logging is diagnostic only; it must never fail the request.
        try:
            for k, v in self.request.headers.items():
                logging.info('%s = %s ' % (k, v))
        except Exception:
            logging.debug('could not log request headers', exc_info=True)

        uri = self.request.uri
        host = '%s://%s/' % (self.request.scheme, self.request.host)

        # Unquote only the path part.  Splitting once keeps a query string
        # intact even when it contains further '?' characters.
        if uri.find('?') != -1:
            raw_path, query = uri.split('?', 1)
            uri = urllib.unquote(raw_path) + '?' + query
        else:
            uri = urllib.unquote(uri)

        url_list = uri.split('/')
        local_host = '/'.join(url_list[0:4]) + '/'
        path = os.path.join(os.path.dirname(__file__), 'index.html')

        # Work on a per-request copy: template_values is a module global, so
        # writing error_msg into it would leak the message into later renders.
        values = dict(template_values)

        if uri == host:
            self.response.out.write(template.render(path, values))
            self.response.out.write(ga)
            return

        remote_host = 'http://' + url_list[3] + '.blogspot.com/'
        url = remote_host + '/'.join(url_list[4:])

        # Decode leniently so undecodable bytes in the path cannot abort the
        # request from inside a debug log call.
        if isinstance(url, unicode):
            logging.debug(url)
        else:
            logging.debug(unicode(url, 'utf-8', 'replace'))

        result = None
        m_s = None
        try:
            # Hash the URL as-is; for ASCII URLs the digest equals the one
            # obtained from the decoded text, and non-ASCII byte strings no
            # longer fail on an implicit ASCII encode.
            m = md5.new()
            m.update(url)
            m_s = m.hexdigest()
            result = memcache.get(m_s)
        except Exception:
            # A cache problem only costs a fresh fetch below.
            logging.exception('memcache lookup failed for %r', url)

        if result is None:
            try:
                result = urlfetch.fetch(url, headers=self.request.headers)
            except Exception:
                logging.exception('fetch failed for %r', url)
                values['error_msg'] = '[%s]' % url
                self.response.out.write(template.render(path, values))
                return

        self.response.headers = result.headers
        if result.status_code != 200:
            self.response.out.write(result.content)
            return

        # A response without a Content-Type header falls through to the
        # error page instead of raising KeyError.
        content_type = result.headers.get('Content-Type', '')
        if content_type.find('image') != -1:
            self.response.out.write(result.content)
            if m_s is not None:
                memcache.add(m_s, result)
            return

        if content_type.find('html') != -1:
            self.response.out.write(
                self.replace(result.content, {remote_host: local_host}))
            self.response.out.write(ga)
        else:
            values['error_msg'] = '[%s]' % url
            self.response.out.write(template.render(path, values))

    def post(self):
        """Redirect to ``/<stuff_url>``, or to ``/`` when the field is empty."""
        stuff_url = self.request.get('stuff_url')
        if stuff_url == '':
            self.redirect('/')
        else:
            self.redirect('/%s' % stuff_url)

    def replace(self, content, replace_str_dict=None):
        """Return ``content`` with every key of the mapping replaced by its value.

        ``replace_str_dict`` maps search strings to replacements; omitting it
        (or passing an empty mapping) returns ``content`` unchanged.
        """
        if not replace_str_dict:
            return content
        for k, v in replace_str_dict.items():
            content = content.replace(k, v)
        return content

def main():
    """Build the WSGI application and run it through the CGI handler."""
    # Every path is routed to MainPage.
    routes = [('/.*', MainPage)]
    application = webapp.WSGIApplication(routes, debug=False)
    wsgiref.handlers.CGIHandler().run(application)


if __name__ == "__main__":
    main()
Show details Hide details

Change log

r28 by ibeyond on Oct 09, 2009   Diff
[No log message]
Go to: 
Project members, sign in to write a code review

Older revisions

r27 by ibeyond on May 27, 2009   Diff
[No log message]
r26 by ibeyond on Jul 24, 2008   Diff
取消Wikipedia的代理。
取消浏览全部blog的链接。
r25 by iBeyond on Jun 29, 2008   Diff
增加Robots.txt文件,阻止维基百科的搜索引擎检索。
All revisions of this file

File info

Size: 5554 bytes, 149 lines
Hosted by Google Code