Skip to content

Commit

Permalink
Refactored YAML parsing
Browse files Browse the repository at this point in the history
- Replaced custom string parsing with YamlDotNet deserializer
- Added test for malformed YAML
  • Loading branch information
jasonjoh committed Jun 6, 2024
1 parent a33a7b4 commit 59f67ac
Show file tree
Hide file tree
Showing 3 changed files with 68 additions and 37 deletions.
3 changes: 3 additions & 0 deletions .vscode/settings.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
{
"dotnet.defaultSolution": "ApiDoctor.sln"
}
31 changes: 31 additions & 0 deletions ApiDoctor.Validation.UnitTests/YamlParserTests.cs
Original file line number Diff line number Diff line change
Expand Up @@ -25,6 +25,7 @@

namespace ApiDoctor.Validation.UnitTests
{
using System.Linq;
using ApiDoctor.Validation;
using ApiDoctor.Validation.Error;
using NUnit.Framework;
Expand All @@ -41,6 +42,18 @@ public class YamlParserTests
toc.keywords:
- foo
- bar
";

// Missing closing double-quote on title property
private static readonly string malformedYaml = @"title: ""Define the /me as singleton
description: ""These are things I had to add in the docs to make sure the Markdown-Scanner""
ms.localizationpriority: medium
author: """"
ms.prod: """"
doc_type: conceptualPageType
toc.keywords:
- foo
- bar
";

[Test]
Expand All @@ -56,5 +69,23 @@ public void YamlWithMultiLineArrayParses()
// Assert
Assert.That(!issues.Issues.WereErrors());
}

[Test]
public void MalformedYamlGeneratesError()
{
// Arrange
_ = new DocSet();
var issues = new IssueLogger();

// Act
DocFile.ParseYamlMetadata(malformedYaml, issues);

// Assert
Assert.That(issues.Issues.WereErrors());
var error = issues.Issues.FirstOrDefault();
Assert.That(error != null);
Assert.That(error.IsError);
Assert.That(error.Message == "Incorrect YAML header format");
}
}
}
71 changes: 34 additions & 37 deletions ApiDoctor.Validation/DocFile.cs
Original file line number Diff line number Diff line change
@@ -1,25 +1,25 @@
/*
* API Doctor
* Copyright (c) Microsoft Corporation
* All rights reserved.
*
* All rights reserved.
*
* MIT License
*
* Permission is hereby granted, free of charge, to any person obtaining a copy of
* this software and associated documentation files (the ""Software""), to deal in
* the Software without restriction, including without limitation the rights to use,
*
* Permission is hereby granted, free of charge, to any person obtaining a copy of
* this software and associated documentation files (the ""Software""), to deal in
* the Software without restriction, including without limitation the rights to use,
* copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the
* Software, and to permit persons to whom the Software is furnished to do so,
* Software, and to permit persons to whom the Software is furnished to do so,
* subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in all
*
* The above copyright notice and this permission notice shall be included in all
* copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED *AS IS*, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED,
* INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
* PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
* HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
* OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
*
* THE SOFTWARE IS PROVIDED *AS IS*, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED,
* INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
* PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
* HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
* OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
*/

Expand All @@ -30,12 +30,13 @@ namespace ApiDoctor.Validation
using System.Diagnostics;
using System.IO;
using System.Linq;
using ApiDoctor.Validation.Config;
using ApiDoctor.Validation.Error;
using ApiDoctor.Validation.TableSpec;
using Tags;
using MarkdownDeep;
using Newtonsoft.Json;
using ApiDoctor.Validation.Config;
using YamlDotNet.Serialization;

/// <summary>
/// A documentation file that may contain one more resources or API methods
Expand All @@ -50,6 +51,8 @@ public partial class DocFile
private readonly List<EnumerationDefinition> enums = new List<EnumerationDefinition>();
private readonly List<string> bookmarks = new List<string>();

private static readonly IDeserializer yamlDeserializer = new DeserializerBuilder().Build();

protected bool HasScanRun;
protected string BasePath;

Expand Down Expand Up @@ -389,29 +392,23 @@ internal static (string YamlFrontMatter, string ProcessedContent) ParseAndRemove

internal static void ParseYamlMetadata(string yamlMetadata, IssueLogger issues)
{
Dictionary<string, string> dictionary = new Dictionary<string, string>();
string[] items = yamlMetadata.Split(new[] { "\r\n", "\n" }, StringSplitOptions.RemoveEmptyEntries);
foreach (string item in items)
Dictionary<string, object> dictionary = null;
try
{
try
{
string[] keyValue = item.Split(':');
dictionary.Add(keyValue[0].Trim(), keyValue[1].Trim());
}
catch (Exception)
{
issues.Error(ValidationErrorCode.IncorrectYamlHeaderFormat, $"Incorrect YAML header format after `{dictionary.Keys.Last()}`");
}
dictionary = yamlDeserializer.Deserialize<Dictionary<string, object>>(yamlMetadata);
}
catch (Exception)
{
issues.Error(ValidationErrorCode.IncorrectYamlHeaderFormat, "Incorrect YAML header format");
}

List<string> missingHeaders = new List<string>();
foreach (var header in DocSet.SchemaConfig.RequiredYamlHeaders)
{
string value;
if (dictionary.TryGetValue(header, out value))
if (dictionary.TryGetValue(header, out object value) && value is string stringValue)
{
value = value.Replace("\"", string.Empty);
if (string.IsNullOrWhiteSpace(value))
stringValue = stringValue.Replace("\"", string.Empty);
if (string.IsNullOrWhiteSpace(stringValue))
{
issues.Warning(ValidationErrorCode.RequiredYamlHeaderMissing, $"Missing value for YAML header: {header}");
}
Expand Down Expand Up @@ -732,7 +729,7 @@ private void CheckDocumentHeaders(List<object> expectedHeaders, IReadOnlyList<Do
while (expectedIndex < expectedHeaders.Count && foundIndex < foundHeaders.Count)
{
var found = foundHeaders[foundIndex];
var result = ValidateDocumentHeader(expectedHeaders, foundHeaders, expectedIndex, foundIndex);
var result = ValidateDocumentHeader(expectedHeaders, foundHeaders, expectedIndex, foundIndex);
var expected = expectedHeaders[expectedIndex] as ExpectedDocumentHeader; // at this point, if header was conditional, the condition has been removed
switch (result)
{
Expand All @@ -743,7 +740,7 @@ private void CheckDocumentHeaders(List<object> expectedHeaders, IReadOnlyList<Do
//if expecting multiple headers of the same pattern, do not increment expected until last header matching pattern is found
if (!expected.AllowMultiple || (expected.AllowMultiple && foundIndex == foundHeaders.Count))
expectedIndex++;

break;

case DocumentHeaderValidationResult.FoundInWrongCase:
Expand Down Expand Up @@ -890,7 +887,7 @@ private DocumentHeaderValidationResult ValidateDocumentHeader(List<object> expec
private static List<DocumentHeader> FlattenDocumentHeaderHierarchy(IReadOnlyList<object> headers)
{
var mergedHeaders = new List<DocumentHeader>();
foreach (var header in headers)
foreach (var header in headers)
{
if (header is ExpectedDocumentHeader expectedHeader)
{
Expand Down Expand Up @@ -1002,7 +999,7 @@ private void AddHeaderToHierarchy(Stack<DocumentHeader> headerStack, Block block
}

/// <summary>
/// Validates code snippets tab section.
/// Validates code snippets tab section.
/// Checks:
/// - No duplicated tabs
/// - Existence of tab boundary at the end of tab group definition
Expand Down Expand Up @@ -1224,7 +1221,7 @@ private void PostProcessEnums(List<EnumerationDefinition> foundEnums, List<Table
// add all the enum values
this.enums.AddRange(foundEnums.Where(e => !string.IsNullOrEmpty(e.MemberName) && !string.IsNullOrEmpty(e.TypeName)));

// if we thought it was a table of type EnumerationValues, it probably holds enum values.
// if we thought it was a table of type EnumerationValues, it probably holds enum values.
// throw error if member name is null which could mean a wrong column name
foreach (var enumType in foundEnums.Where(e => string.IsNullOrEmpty(e.MemberName) && !string.IsNullOrEmpty(e.TypeName))
.Select(x => new { x.TypeName, x.Namespace }).Distinct())
Expand Down

0 comments on commit 59f67ac

Please sign in to comment.