> My only concern is in the commit message, about performance. A > change that has lots of files in it will cause many roundtrips to > p4d to do "p4 where" on each. When the files don't have much > edited content, this new approach will make the import take twice > as long, I'll guess. Do you have a big repository where you > could test that? I measured performance of "git p4 clone --use-client-spec" with a repository it has 1925 files, 50MB. Original: 8.05s user 32.02s system 15% cpu 4:25.34 total Apply patch: 9.02s user 53.19s system 14% cpu 6:56.41 total It is acceptable in my situation, but looks quite slow... Then I implemented one batch query version 7.92s user 33.03s system 15% cpu 4:25.59 total It is same as original My additional patch is below. I investigate call graph (attached rough sketch) and implement batch query in "commit()" and "splitFilesIntoBranches()". In addition, modified "map_in_client" to just search cache value. Could you accept? Subject: [PATCH] git p4: Implement as one batch "p4 where" query to interpret view spec Query for each file is decrese performance. So I implement query to get client file path as one batch query. The query must called before use client path (map_in_client() ). Result of performance measurement, about 40% speed up Signed-off-by: KazukiSaitoh <ksaitoh560@xxxxxxxxx> --- git-p4.py | 70 ++++++++++++++++++++++++++++++++++++++++++++++----------------- 1 file changed, 51 insertions(+), 19 deletions(-) diff --git a/git-p4.py b/git-p4.py index 40522f7..8cbee24 100755 --- a/git-p4.py +++ b/git-p4.py @@ -1849,37 +1849,46 @@ class View(object): if not exclude: self.mappings.append(depot_side) - def map_in_client(self, depot_path): - """Return the relative location in the client where this - depot file should live. Returns "" if the file should - not be mapped in the client.""" + def convert_client_path(self, clientFile): + # chop off //client/ part to make it relative + if not clientFile.startswith(self.client_prefix): + die("No prefix '%s' on clientFile '%s'" % + (self.client_prefix, clientFile)) + return clientFile[len(self.client_prefix):] - if depot_path in self.client_spec_path_cache: - return self.client_spec_path_cache[depot_path] + def update_client_spec_path_cache(self, files): + fileArgs = [f for f in files if f not in self.client_spec_path_cache] - where_result = p4CmdList(['where', depot_path]) - if len(where_result) == 0: - die("No result from 'p4 where %s'" % depot_path) - client_path = "" + if len(fileArgs) == 0: + return # All files in cache + + where_result = p4CmdList(["-x", "-", "where"], stdin=fileArgs) for res in where_result: if "code" in res and res["code"] == "error": # assume error is "... file(s) not in client view" - client_path = "" continue if "clientFile" not in res: die("No clientFile from 'p4 where %s'" % depot_path) if "unmap" in res: # it will list all of them, but only one not unmap-ped continue - # chop off //client/ part to make it relative - clientFile = res["clientFile"] - if not clientFile.startswith(self.client_prefix): - die("No prefix '%s' on clientFile '%s'" % - (self.client_prefix, clientFile)) - client_path = clientFile[len(self.client_prefix):] + self.client_spec_path_cache[res['depotFile']] = self.convert_client_path(res["clientFile"]) + + # not found files or unmap files set to "" + for depotFile in fileArgs: + if depotFile not in self.client_spec_path_cache: + self.client_spec_path_cache[depotFile] = "" + + def map_in_client(self, depot_path): + """Return the relative location in the client where this + depot file should live. Returns "" if the file should + not be mapped in the client.""" + + if depot_path in self.client_spec_path_cache: + return self.client_spec_path_cache[depot_path] - self.client_spec_path_cache[depot_path] = client_path - return client_path + die( "Error: %s is not found in client spec path" % depot_path ) + return "" class P4Sync(Command, P4UserMap): delete_actions = ( "delete", "move/delete", "purge" ) @@ -2006,6 +2015,22 @@ class P4Sync(Command, P4UserMap): """Look at each depotFile in the commit to figure out to what branch it belongs.""" + # create file list and get client paths by one batch "p4 where" query + if self.clientSpecDirs: + fnum = 0 + file_list = [] + while commit.has_key("depotFile%s" % fnum): + path = commit["depotFile%s" % fnum] + found = [p for p in self.depotPaths + if p4PathStartsWith(path, p)] + if not found: + fnum = fnum + 1 + continue + + file_list.append(path) + fnum = fnum + 1 + self.clientSpecDirs.update_client_spec_path_cache(file_list) + branches = {} fnum = 0 while commit.has_key("depotFile%s" % fnum): @@ -2255,6 +2280,13 @@ class P4Sync(Command, P4UserMap): else: sys.stderr.write("Ignoring file outside of prefix: %s\n" % f['path']) + # get client paths by one batch "p4 where" query + if self.clientSpecDirs: + file_list = [] + for f in files: + file_list.append(f['path']) + self.clientSpecDirs.update_client_spec_path_cache(file_list) + self.gitStream.write("commit %s\n" % branch) # gitStream.write("mark :%s\n" % details["change"]) self.committedChanges.add(int(details["change"])) -- 1.8.4-rc2
Attachment:
rough sketch_of_call_graph.png
Description: PNG image