2 # Copyright 2013 The Chromium Authors. All rights reserved.
3 # Use of this source code is governed by a BSD-style license that can be
4 # found in the LICENSE file.
7 from copy
import deepcopy
8 from cStringIO
import StringIO
9 from functools
import partial
10 from hashlib
import sha1
11 from random
import random
13 from zipfile
import ZipFile
15 from caching_file_system
import CachingFileSystem
16 from file_system
import FileNotFoundError
, StatInfo
17 from fake_url_fetcher
import FakeURLFSFetcher
, MockURLFetcher
18 from local_file_system
import LocalFileSystem
19 from new_github_file_system
import GithubFileSystem
20 from object_store_creator
import ObjectStoreCreator
21 from test_file_system
import TestFileSystem
24 class _TestBundle(object):
25 '''Bundles test file data with a GithubFileSystem and test utilities. Create
26 GithubFileSystems via |CreateGfs()|, the Fetcher it uses as |fetcher|,
27 randomly mutate its contents via |Mutate()|, and access the underlying zip
34 'zipfile/hello.txt': 'world',
35 'zipfile/readme': 'test zip',
36 'zipfile/dir/file1': 'contents',
37 'zipfile/dir/file2': 'more contents'
43 'HEAD': self
._MakeShaJson
(self
._GenerateHash
())
45 'zipball': self
._ZipFromFiles
(self
.files
)
51 def CreateGfsAndFetcher(self
):
53 def create_mock_url_fetcher(base_path
):
55 fetchers
.append(MockURLFetcher(
56 FakeURLFSFetcher(TestFileSystem(self
._test
_files
), base_path
)))
59 # Constructing |gfs| will create a fetcher.
60 gfs
= GithubFileSystem
.ForTest(
61 'changing-repo', create_mock_url_fetcher
, path
='')
62 assert len(fetchers
) == 1
63 return gfs
, fetchers
[0]
66 fake_version
= self
._GenerateHash
()
67 fake_data
= self
._GenerateHash
()
68 self
.files
['zipfile/hello.txt'] = fake_data
69 self
.files
['zipfile/new-file'] = fake_data
70 self
.files
['zipfile/dir/file1'] = fake_data
71 self
._test
_files
['test_owner']['changing-repo']['zipball'] = (
72 self
._ZipFromFiles
(self
.files
))
73 self
._test
_files
['test_owner']['changing-repo']['commits']['HEAD'] = (
74 self
._MakeShaJson
(fake_version
))
75 return fake_version
, fake_data
def _GenerateHash(self):
  '''Generates an arbitrary SHA1 hash.

  Returns the 40-character hex digest of the SHA1 of a random float's string
  form. The value is only meant to look like a commit hash or to act as
  throwaway file contents; it is not cryptographically meaningful.
  '''
  # hashlib requires bytes on Python 3. Encoding the ASCII text of the float
  # is a no-op on Python 2, so the digest is unchanged there.
  seed = str(random()).encode('utf-8')
  return sha1(seed).hexdigest()
def _MakeShaJson(self, hash_value):
  '''Returns the on-disk HEAD commit JSON, re-serialised with its 'sha' field
  replaced by |hash_value|.
  '''
  head_path = 'test_data/github_file_system/test_owner/repo/commits/HEAD'
  raw_commit = LocalFileSystem('').ReadSingle(head_path).Get()
  # Parse a copy of what was read, then overwrite only the commit hash.
  commit = json.loads(deepcopy(raw_commit))
  commit['sha'] = hash_value
  return json.dumps(commit)
def _ZipFromFiles(self, file_dict):
  '''Builds an in-memory zip archive from |file_dict|.

  |file_dict| maps archive member names to their contents. Returns the raw
  bytes of the resulting zip archive; an empty dict yields a valid, empty
  archive.
  '''
  # Imported locally so this helper does not rely on the Python 2-only
  # cStringIO module; io.BytesIO is available on Python 2.6+ and Python 3.
  from io import BytesIO
  buf = BytesIO()
  # The archive has to be closed before the buffer is read, otherwise the
  # zip's trailing records are never written. The with-statement guarantees
  # that, even if writestr() raises.
  with ZipFile(buf, 'w') as archive:
    for filename, contents in file_dict.items():
      archive.writestr(filename, contents)
  return buf.getvalue()
97 class TestGithubFileSystem(unittest
.TestCase
):
99 self
._gfs
= GithubFileSystem
.ForTest(
100 'repo', partial(FakeURLFSFetcher
, LocalFileSystem('')))
101 # Start and finish the repository load.
102 self
._cgfs
= CachingFileSystem(self
._gfs
, ObjectStoreCreator
.ForTest())
104 def testReadDirectory(self
):
105 self
._gfs
.Refresh().Get()
107 sorted(['requirements.txt', '.gitignore', 'README.md', 'src/']),
108 sorted(self
._gfs
.ReadSingle('').Get()))
110 sorted(['__init__.notpy', 'hello.notpy']),
111 sorted(self
._gfs
.ReadSingle('src/').Get()))
113 def testReadFile(self
):
114 self
._gfs
.Refresh().Get()
116 '# Compiled Python files\n'
119 self
.assertEqual(expected
, self
._gfs
.ReadSingle('.gitignore').Get())
121 def testMultipleReads(self
):
122 self
._gfs
.Refresh().Get()
124 self
._gfs
.ReadSingle('requirements.txt').Get(),
125 self
._gfs
.ReadSingle('requirements.txt').Get())
128 self
._gfs
.Refresh().Get()
130 'src/': sorted(['hello.notpy', '__init__.notpy']),
131 '': sorted(['requirements.txt', '.gitignore', 'README.md', 'src/'])
134 read
= self
._gfs
.Read(['', 'src/']).Get()
135 self
.assertEqual(expected
['src/'], sorted(read
['src/']))
136 self
.assertEqual(expected
[''], sorted(read
['']))
139 # This is the hash value from the zip on disk.
140 real_hash
= 'c36fc23688a9ec9e264d3182905dc0151bfff7d7'
142 self
._gfs
.Refresh().Get()
143 dir_stat
= StatInfo(real_hash
, {
144 'hello.notpy': StatInfo(real_hash
),
145 '__init__.notpy': StatInfo(real_hash
)
148 self
.assertEqual(StatInfo(real_hash
), self
._gfs
.Stat('README.md'))
149 self
.assertEqual(StatInfo(real_hash
), self
._gfs
.Stat('src/hello.notpy'))
150 self
.assertEqual(dir_stat
, self
._gfs
.Stat('src/'))
def testBadReads(self):
  '''Checks that Stat() and the resolution of a ReadSingle() future both
  raise FileNotFoundError for a path the test expects to be absent.
  '''
  missing_path = 'DONT_README.md'
  gfs = self._gfs
  gfs.Refresh().Get()
  self.assertRaises(FileNotFoundError, gfs.Stat, missing_path)
  # Creating the future must not raise; only resolving it via Get() should.
  pending_read = gfs.ReadSingle(missing_path)
  self.assertRaises(FileNotFoundError, pending_read.Get)
158 def testCachingFileSystem(self
):
159 self
._cgfs
.Refresh().Get()
160 initial_cgfs_read_one
= self
._cgfs
.ReadSingle('src/hello.notpy').Get()
162 self
.assertEqual(initial_cgfs_read_one
,
163 self
._gfs
.ReadSingle('src/hello.notpy').Get())
164 self
.assertEqual(initial_cgfs_read_one
,
165 self
._cgfs
.ReadSingle('src/hello.notpy').Get())
167 initial_cgfs_read_two
= self
._cgfs
.Read(
168 ['README.md', 'requirements.txt']).Get()
171 initial_cgfs_read_two
,
172 self
._gfs
.Read(['README.md', 'requirements.txt']).Get())
174 initial_cgfs_read_two
,
175 self
._cgfs
.Read(['README.md', 'requirements.txt']).Get())
def testWithoutRefresh(self):
  '''Reads a directory listing without calling Refresh() first.'''
  # Without refreshing it will still read the content from blobstore, and it
  # does this via the magic of the FakeURLFSFetcher.
  listing = self._gfs.ReadSingle('src/').Get()
  expected = ['__init__.notpy', 'hello.notpy']
  self.assertEqual(expected, sorted(listing))
183 def testRefresh(self
):
184 test_bundle
= _TestBundle()
185 gfs
, fetcher
= test_bundle
.CreateGfsAndFetcher()
187 # It shouldn't fetch until Refresh does so; then it will do 2, one for the
188 # stat, and another for the read.
189 self
.assertTrue(*fetcher
.CheckAndReset())
191 self
.assertTrue(*fetcher
.CheckAndReset(fetch_count
=1,
193 fetch_resolve_count
=1))
195 # Refresh is just an alias for Read('').
197 self
.assertTrue(*fetcher
.CheckAndReset())
199 initial_dir_read
= sorted(gfs
.ReadSingle('').Get())
200 initial_file_read
= gfs
.ReadSingle('dir/file1').Get()
202 version
, data
= test_bundle
.Mutate()
204 # Check that changes have not affected the file system yet.
205 self
.assertEqual(initial_dir_read
, sorted(gfs
.ReadSingle('').Get()))
206 self
.assertEqual(initial_file_read
, gfs
.ReadSingle('dir/file1').Get())
207 self
.assertNotEqual(StatInfo(version
), gfs
.Stat(''))
209 gfs
, fetcher
= test_bundle
.CreateGfsAndFetcher()
211 self
.assertTrue(*fetcher
.CheckAndReset(fetch_count
=1,
213 fetch_resolve_count
=1))
215 # Check that the changes have affected the file system.
216 self
.assertEqual(data
, gfs
.ReadSingle('new-file').Get())
217 self
.assertEqual(test_bundle
.files
['zipfile/dir/file1'],
218 gfs
.ReadSingle('dir/file1').Get())
219 self
.assertEqual(StatInfo(version
), gfs
.Stat('new-file'))
221 # Regression test: ensure that reading the data after it's been mutated,
222 # but before Refresh() has been realised, still returns the correct data.
223 gfs
, fetcher
= test_bundle
.CreateGfsAndFetcher()
224 version
, data
= test_bundle
.Mutate()
226 refresh_future
= gfs
.Refresh()
227 self
.assertTrue(*fetcher
.CheckAndReset(fetch_count
=1, fetch_async_count
=1))
229 self
.assertEqual(data
, gfs
.ReadSingle('new-file').Get())
230 self
.assertEqual(test_bundle
.files
['zipfile/dir/file1'],
231 gfs
.ReadSingle('dir/file1').Get())
232 self
.assertEqual(StatInfo(version
), gfs
.Stat('new-file'))
235 self
.assertTrue(*fetcher
.CheckAndReset(fetch_resolve_count
=1))
237 def testGetThenRefreshOnStartup(self
):
238 # Regression test: Test that calling Get() but never resolving the future,
239 # then Refresh()ing the data, causes the data to be refreshed.
240 test_bundle
= _TestBundle()
241 gfs
, fetcher
= test_bundle
.CreateGfsAndFetcher()
242 self
.assertTrue(*fetcher
.CheckAndReset())
244 # Get a predictable version.
245 version
, data
= test_bundle
.Mutate()
247 read_future
= gfs
.ReadSingle('hello.txt')
248 # Fetch for the Stat(), async-fetch for the Read().
249 self
.assertTrue(*fetcher
.CheckAndReset(fetch_count
=1, fetch_async_count
=1))
251 refresh_future
= gfs
.Refresh()
252 self
.assertTrue(*fetcher
.CheckAndReset())
254 self
.assertEqual(data
, read_future
.Get())
255 self
.assertTrue(*fetcher
.CheckAndReset(fetch_resolve_count
=1))
256 self
.assertEqual(StatInfo(version
), gfs
.Stat('hello.txt'))
257 self
.assertTrue(*fetcher
.CheckAndReset())
259 # The fetch will already have been resolved, so resolving the Refresh won't
262 self
.assertTrue(*fetcher
.CheckAndReset())
264 # Read data should not have changed.
265 self
.assertEqual(data
, gfs
.ReadSingle('hello.txt').Get())
266 self
.assertEqual(StatInfo(version
), gfs
.Stat('hello.txt'))
267 self
.assertTrue(*fetcher
.CheckAndReset())
270 if __name__
== '__main__':