From 3911dd670c34a54ea3ddaea0e5859b4a32d5a12d Mon Sep 17 00:00:00 2001 From: "Eli C. Lowry" <83078660+Enkidu93@users.noreply.github.com> Date: Tue, 16 Jul 2024 15:08:09 -0400 Subject: [PATCH] Extend manual test to process multiple projects including zipped projects (#227) * Extend manual test to process multiple projects including zipped projects * Put ignore back * Add comment with testing instructions --------- Co-authored-by: John Lambert --- .../Corpora/UsfmManualTests.cs | 112 +++++++++++++----- 1 file changed, 82 insertions(+), 30 deletions(-) diff --git a/tests/SIL.Machine.Tests/Corpora/UsfmManualTests.cs b/tests/SIL.Machine.Tests/Corpora/UsfmManualTests.cs index f0b636cfb..6d81ae0b2 100644 --- a/tests/SIL.Machine.Tests/Corpora/UsfmManualTests.cs +++ b/tests/SIL.Machine.Tests/Corpora/UsfmManualTests.cs @@ -1,4 +1,5 @@ -using System.Text.Json; +using System.IO.Compression; +using System.Text.Json; using NUnit.Framework; namespace SIL.Machine.Corpora; @@ -66,40 +67,91 @@ public record PretranslationDto [Test] [Ignore("This is for manual testing only. Remove this tag to run the test.")] + /* + In order to run this test on specific projects, place the Paratext projects or Paratext project zips in the Corpora/TestData/project/ folder. NOTE(review): assuming ParatextProjectPath points at that folder, when it has no Settings.xml of its own the test body enumerates it with Directory.EnumerateFiles, which yields files only, so unzipped project folders placed inside it appear to be skipped (confirm). + If only testing one project, you can instead place the project in the Corpora/TestData/ folder and rename it to "project"; when ParatextProjectPath directly contains a Settings.xml file it is processed as a single project. + */ public async Task CreateUsfmFile() { - FileParatextProjectSettingsParser parser = new(ParatextProjectPath); - ParatextProjectSettings settings = parser.Parse(); + async Task GetUsfmAsync(string projectPath) + { + ParatextProjectSettingsParserBase parser; + ZipArchive? 
projectArchive = null; /* NOTE(review): nothing in this method disposes the archive once it has been opened */ + try + { + projectArchive = ZipFile.Open(projectPath, ZipArchiveMode.Read); + parser = new ZipParatextProjectSettingsParser(projectArchive); + } + catch (UnauthorizedAccessException) /* not opened as a zip archive (presumably because projectPath is a directory; TODO confirm on every platform), so fall back to the file-based settings parser */ + { + parser = new FileParatextProjectSettingsParser(projectPath); + } + ParatextProjectSettings settings = parser.Parse(); - // Read text from pretranslations file - using Stream pretranslationStream = File.OpenRead(PretranslationPath); - (IReadOnlyList, string)[] pretranslations = await JsonSerializer - .DeserializeAsyncEnumerable( - pretranslationStream, - new JsonSerializerOptions { PropertyNamingPolicy = JsonNamingPolicy.CamelCase } - ) - .Select(p => - ( - (IReadOnlyList)( - p?.Refs.Select(r => ScriptureRef.Parse(r, settings.Versification).ToRelaxed()).ToArray() ?? [] - ), - p?.Translation ?? "" + // Read text from pretranslations file + using Stream pretranslationStream = File.OpenRead(PretranslationPath); + (IReadOnlyList, string)[] pretranslations = await JsonSerializer + .DeserializeAsyncEnumerable( + pretranslationStream, + new JsonSerializerOptions { PropertyNamingPolicy = JsonNamingPolicy.CamelCase } ) - ) - .ToArrayAsync(); - - foreach ( - string sfmFileName in Directory.EnumerateFiles( - ParatextProjectPath, - $"{settings.FileNamePrefix}*{settings.FileNameSuffix}" - ) - ) + .Select(p => + ( + (IReadOnlyList)( + p?.Refs.Select(r => ScriptureRef.Parse(r, settings.Versification).ToRelaxed()).ToArray() + ?? [] + ), + p?.Translation ?? 
"" + ) + ) + .ToArrayAsync(); + List sfmTexts = []; + if (projectArchive == null) + { + sfmTexts = ( + await Task.WhenAll( + Directory + .EnumerateFiles(projectPath, $"{settings.FileNamePrefix}*{settings.FileNameSuffix}") + .Select(async sfmFileName => await File.ReadAllTextAsync(sfmFileName)) + ) + ).ToList(); + } + else + { + sfmTexts = projectArchive + .Entries.Where(e => + e.Name.StartsWith(settings.FileNamePrefix) && e.Name.EndsWith(settings.FileNameSuffix) + ) + .Select(e => + { + string contents; + using (var sr = new StreamReader(e.Open())) + { + contents = sr.ReadToEnd(); + } + return contents; + }) + .ToList(); + } + foreach (string usfm in sfmTexts) + { + var updater = new UsfmTextUpdater(pretranslations, stripAllText: true, preferExistingText: true); + UsfmParser.Parse(usfm, updater, settings.Stylesheet, settings.Versification); + string newUsfm = updater.GetUsfm(settings.Stylesheet); + Assert.That(newUsfm, Is.Not.Null); + } + } + if (!File.Exists(Path.Combine(ParatextProjectPath, "Settings.xml"))) { - var updater = new UsfmTextUpdater(pretranslations, stripAllText: true, preferExistingText: true); - string usfm = await File.ReadAllTextAsync(sfmFileName); - UsfmParser.Parse(usfm, updater, settings.Stylesheet, settings.Versification); - string newUsfm = updater.GetUsfm(settings.Stylesheet); - Assert.That(newUsfm, Is.Not.Null); + Assert.Multiple(() => + { + foreach (string subdir in Directory.EnumerateFiles(ParatextProjectPath)) + Assert.DoesNotThrowAsync(async () => await GetUsfmAsync(subdir), $"Failed to parse {subdir}"); + }); + } + else + { + await GetUsfmAsync(ParatextProjectPath); } } }