#483 make skip missing fonts even more resilient to nonsense files

This commit is contained in:
Eliot Jones 2022-12-11 16:18:09 -05:00
parent 2aed996319
commit c8874c5984
6 changed files with 64 additions and 11 deletions

View File

@ -0,0 +1,34 @@
namespace UglyToad.PdfPig.Fonts
{
using System;
using System.Runtime.Serialization;
/// <summary>
/// Thrown when a PDF contains an invalid compressed data stream.
/// </summary>
[Serializable]
public class CorruptCompressedDataException : Exception
{
/// <inheritdoc />
public CorruptCompressedDataException()
{
}
/// <inheritdoc />
public CorruptCompressedDataException(string message) : base(message)
{
}
/// <inheritdoc />
public CorruptCompressedDataException(string message, Exception inner) : base(message, inner)
{
}
/// <inheritdoc />
protected CorruptCompressedDataException(
SerializationInfo info,
StreamingContext context) : base(info, context)
{
}
}
}

View File

@ -6,7 +6,7 @@
internal interface IResourceStore internal interface IResourceStore
{ {
void LoadResourceDictionary(DictionaryToken resourceDictionary); void LoadResourceDictionary(DictionaryToken resourceDictionary, InternalParsingOptions parsingOptions);
/// <summary> /// <summary>
/// Remove any named resources and associated state for the last resource dictionary loaded. /// Remove any named resources and associated state for the last resource dictionary loaded.

View File

@ -33,7 +33,7 @@
this.fontFactory = fontFactory; this.fontFactory = fontFactory;
} }
public void LoadResourceDictionary(DictionaryToken resourceDictionary) public void LoadResourceDictionary(DictionaryToken resourceDictionary, InternalParsingOptions parsingOptions)
{ {
lastLoadedFont = (null, null); lastLoadedFont = (null, null);
@ -43,7 +43,7 @@
{ {
var fontDictionary = DirectObjectFinder.Get<DictionaryToken>(fontBase, scanner); var fontDictionary = DirectObjectFinder.Get<DictionaryToken>(fontBase, scanner);
LoadFontDictionary(fontDictionary); LoadFontDictionary(fontDictionary, parsingOptions);
} }
if (resourceDictionary.TryGet(NameToken.Xobject, out var xobjectBase)) if (resourceDictionary.TryGet(NameToken.Xobject, out var xobjectBase))
@ -132,7 +132,7 @@
currentResourceState.Pop(); currentResourceState.Pop();
} }
private void LoadFontDictionary(DictionaryToken fontDictionary) private void LoadFontDictionary(DictionaryToken fontDictionary, InternalParsingOptions parsingOptions)
{ {
lastLoadedFont = (null, null); lastLoadedFont = (null, null);
@ -157,7 +157,18 @@
continue; continue;
} }
loadedFonts[reference] = fontFactory.Get(fontObject); try
{
loadedFonts[reference] = fontFactory.Get(fontObject);
}
catch
{
if (!parsingOptions.SkipMissingFonts)
{
throw;
}
}
} }
else if (pair.Value is DictionaryToken fd) else if (pair.Value is DictionaryToken fd)
{ {

View File

@ -1,5 +1,6 @@
namespace UglyToad.PdfPig.Filters namespace UglyToad.PdfPig.Filters
{ {
using Fonts;
using System; using System;
using System.Collections.Generic; using System.Collections.Generic;
using System.IO; using System.IO;
@ -79,10 +80,17 @@
memoryStream.ReadByte(); memoryStream.ReadByte();
memoryStream.ReadByte(); memoryStream.ReadByte();
using (var deflate = new DeflateStream(memoryStream, CompressionMode.Decompress)) try
{ {
deflate.CopyTo(output); using (var deflate = new DeflateStream(memoryStream, CompressionMode.Decompress))
return output.ToArray(); {
deflate.CopyTo(output);
return output.ToArray();
}
}
catch (InvalidDataException ex)
{
throw new CorruptCompressedDataException("Invalid Flate compressed stream encountered", ex);
} }
} }
} }

View File

@ -479,7 +479,7 @@
var hasResources = formStream.StreamDictionary.TryGet<DictionaryToken>(NameToken.Resources, pdfScanner, out var formResources); var hasResources = formStream.StreamDictionary.TryGet<DictionaryToken>(NameToken.Resources, pdfScanner, out var formResources);
if (hasResources) if (hasResources)
{ {
resourceStore.LoadResourceDictionary(formResources); resourceStore.LoadResourceDictionary(formResources, parsingOptions);
} }
// 1. Save current state. // 1. Save current state.

View File

@ -63,13 +63,13 @@
{ {
var resource = pageTreeMembers.ParentResources.Dequeue(); var resource = pageTreeMembers.ParentResources.Dequeue();
resourceStore.LoadResourceDictionary(resource); resourceStore.LoadResourceDictionary(resource, parsingOptions);
stackDepth++; stackDepth++;
} }
if (dictionary.TryGet(NameToken.Resources, pdfScanner, out DictionaryToken resources)) if (dictionary.TryGet(NameToken.Resources, pdfScanner, out DictionaryToken resources))
{ {
resourceStore.LoadResourceDictionary(resources); resourceStore.LoadResourceDictionary(resources, parsingOptions);
stackDepth++; stackDepth++;
} }