chrome/common/extensions/docs/server2/subversion_file_system.py - Issue 10828235: Extensions Docs Server: Efficient MemcacheFileSystem

Side by Side Diff: chrome/common/extensions/docs/server2/subversion_file_system.py

Issue 10828235: Extensions Docs Server: Efficient MemcacheFileSystem (Closed) Base URL: svn://svn.chromium.org/chrome/trunk/src

Patch Set: Created 8 years, 4 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch | Annotate | Revision Log

« chrome/common/extensions/docs/server2/local_file_system.py ('K') | « chrome/common/extensions/docs/server2/memcache_file_system_test.py ('k') | chrome/common/extensions/docs/server2/subversion_file_system_test.py » ('j') | chrome/common/extensions/docs/server2/subversion_file_system_test.py » ('J')
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

OLD	NEW
1 # Copyright (c) 2012 The Chromium Authors. All rights reserved.	1 # Copyright (c) 2012 The Chromium Authors. All rights reserved.

2 # Use of this source code is governed by a BSD-style license that can be	2 # Use of this source code is governed by a BSD-style license that can be

3 # found in the LICENSE file.	3 # found in the LICENSE file.

4	4

5 import re	5 import re

6 import xml.dom.minidom as xml	6 import xml.dom.minidom as xml

	7 from xml.parsers.expat import ExpatError

7	8

8 import file_system	9 import file_system

9 from future import Future	10 from future import Future

10	11

11 class SubversionFileSystem(file_system.FileSystem):	12 class SubversionFileSystem(file_system.FileSystem):

12 """Class to fetch resources from src.chromium.org.	13 """Class to fetch resources from src.chromium.org.

13 """	14 """

14 def __init__(self, fetcher):	15 def __init__(self, fetcher, stat_fetcher):

15 self._fetcher = fetcher	16 self._fetcher = fetcher

	17 self._stat_fetcher = stat_fetcher

16	18

17 def Read(self, paths, binary=False):	19 def Read(self, paths, binary=False):

18 return Future(delegate=_AsyncFetchFuture(paths, self._fetcher, binary))	20 return Future(delegate=_AsyncFetchFuture(paths, self._fetcher, binary))

19	21

	22 def _ParseHTML(self, html):

	23 """Unfortunately, the viewvc page has a stray </div> tag, so this takes care

	24 of all mismatched tags.

	25 """

	26 try:

	27 return xml.parseString(html)

	28 except ExpatError as e:

	29 new_html = []

	30 for lineno, line in enumerate(html.split('\n')):

	31 if e.lineno != lineno + 1:

	32 new_html.append(line)

	33 return self._ParseHTML('\n'.join(new_html))

	34

	35 def _CreateStatInfo(self, html):

	36 dom = self._ParseHTML(html)

	37 # Brace yourself, this is about to get ugly. The page returned from viewvc

	38 # was not the prettiest.
	not at google - send to devlin 2012/08/10 06:42:24 heh. Let's hope it doesn't change; but if it does, heh. Let's hope it doesn't change; but if it does, make sure we can catch it and update this function + redeploy.
	39 tds = dom.getElementsByTagName('td')

	40 a_list = []

	41 found = False

	42 dir_revision = None

	43 for td in tds:

	44 if found:

	45 dir_revision = td.getElementsByTagName('a')[0].firstChild.nodeValue

	46 found = False

	47 a_list.extend(td.getElementsByTagName('a'))

	48 if (td.firstChild is not None and

	49 td.firstChild.nodeValue == 'Directory revision:'):

	50 found = True

	51 child_revisions = {}

	52 for i in range(len(a_list)):

	53 name = a_list[i].getAttribute('name')

	54 if name:

	55 rev = a_list[i + 1].getElementsByTagName('strong')[0]

	56 if 'file' in a_list[i + 1].getAttribute('title'):

	57 child_revisions[name] = rev.firstChild.nodeValue

	58 else:

	59 child_revisions[name + '/'] = rev.firstChild.nodeValue

	60 return self.StatInfo(dir_revision, child_revisions)

	61

20 def Stat(self, path):	62 def Stat(self, path):

21 directory = path.rsplit('/', 1)[0]	63 directory = path.rsplit('/', 1)[0]

22 dir_html = self._fetcher.Fetch(directory + '/').content	64 dir_html = self._stat_fetcher.Fetch(directory + '/').content

23 return self.StatInfo(int(re.search('([0-9]+)', dir_html).group(0)))	65 return self._CreateStatInfo(dir_html)

24	66

25 class _AsyncFetchFuture(object):	67 class _AsyncFetchFuture(object):

26 def __init__(self, paths, fetcher, binary):	68 def __init__(self, paths, fetcher, binary):

27 # A list of tuples of the form (path, Future).	69 # A list of tuples of the form (path, Future).

28 self._fetches = []	70 self._fetches = []

29 self._value = {}	71 self._value = {}

30 self._error = None	72 self._error = None

31 self._fetches = [(path, fetcher.FetchAsync(path)) for path in paths]	73 self._fetches = [(path, fetcher.FetchAsync(path)) for path in paths]

32 self._binary = binary	74 self._binary = binary

33	75

(...skipping 12 matching lines...) Expand all Loading...
46 elif path.endswith('/'):	88 elif path.endswith('/'):

47 self._value[path] = self._ListDir(result.content)	89 self._value[path] = self._ListDir(result.content)

48 elif not self._binary:	90 elif not self._binary:

49 self._value[path] = file_system._ProcessFileData(result.content, path)	91 self._value[path] = file_system._ProcessFileData(result.content, path)

50 else:	92 else:

51 self._value[path] = result.content	93 self._value[path] = result.content

52 if self._error is not None:	94 if self._error is not None:

53 raise self._error	95 raise self._error

54 return self._value	96 return self._value

55	97

OLD	NEW