[ 
https://issues.apache.org/jira/browse/TIKA-3446?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=17460262#comment-17460262
 ] 

Hudson commented on TIKA-3446:
------------------------------

UNSTABLE: Integrated in Jenkins build Tika » tika-branch1x-jdk8 #153 (See 
[https://ci-builds.apache.org/job/Tika/job/tika-branch1x-jdk8/153/])
port the TIKA-3446 work from the 2.x branch. (#465) (github: 
[https://github.com/apache/tika/commit/b2e442ddcb3f9c870bed1daf9827413423eba219])
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/util/UuidUtils.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/property/IProperty.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/OneNoteDocument.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/EncryptionObject.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/unsigned/UShort.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/IndentUtil.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/JCIDObject.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/property/NoData.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/StreamObjectParseErrorException.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/ZipHeader.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/RevisionStoreObjectGroup.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/StorageManifestSchemaGUID.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/RevisionManifestRootDeclare.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/exception/DataElementParseErrorException.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/AlternativePackaging.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/StorageIndexManifestMapping.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/FileNodePtrBackPush.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/OneNotePtr.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/CellManifestCurrentRevision.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/StreamObjectHeaderStart.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/BinaryItem.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/unsigned/ULong.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/ObjectGroupObjectData.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/PropertySet.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/util/BitConverter.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/DataElementHash.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/StreamObject.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/chunking/SimpleChunking.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/util/Bit.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/ObjectGroupObjectDataBLOBReference.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/space/ObjectSpaceObjectStreamOfOSIDs.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/AdapterHelper.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/DataNodeObjectData.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/JCID.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/chunking/ChunkingFactory.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/PropertySet.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/ObjectGroupMetadataDeclarations.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/DataElementPackage.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/JCIDPropertySetTypeEnum.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/RevisionManifestDataElementData.java
* (edit) 
tika-parsers/src/test/java/org/apache/tika/parser/microsoft/onenote/OneNoteParserTest.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/unsigned/UInteger.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/OneNoteTreeWalker.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/ObjectGroupData.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/IntermediateNodeObject.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/ObjectSpaceObjectPropSet.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/StreamObjectHeaderStart16bit.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/ExtendedGUID.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/RevisionManifest.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/StreamObjectHeaderEnd.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/PropertySetObject.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/chunking/AbstractChunking.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/PropertyValue.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/util/LittleEndianBitConverter.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/property/TwoBytesOfData.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/util/BitReader.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/RevisionManifestObjectGroupReferences.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/StreamObjectHeaderEnd8bit.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/RevisionManifest.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/CellIDArray.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/FileNode.java
* (add) 
tika-parsers/src/test/resources/test-documents/testOneNoteFromOffice365-2.one
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/MSOneStorePackage.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/DataElement.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/StreamObjectTypeHeaderStart.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/util/SequenceNumberGenerator.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/Compact64bitInt.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/DataElementType.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/chunking/ChunkingMethod.java
* (add) 
tika-parsers/src/test/resources/test-documents/testOneNote2007OrEarlier.one
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/StorageIndexRevisionMapping.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/StorageManifestRootDeclare.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/OneNoteLegacyDumpStrings.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/OneNotePropertyEnum.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/ObjectGroupMetadata.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/IFSSHTTPBSerializable.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/OneNoteParser.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/property/FourBytesOfData.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/space/ObjectSpaceObjectStreamHeader.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/SignatureObject.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/StreamObjectHeaderEnd16bit.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/BasicObject.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/FileNodeList.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/StreamObjectHeaderStart32bit.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/FileChunkReference.java
* (delete) 
tika-parsers/src/test/resources/test-documents/testOneNote2007OrEarlier2.one
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/FileDataStoreObject.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/ExGUIDArray.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/chunking/ZipFilesChunking.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/RootObjectReference.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/ObjectSpaceObjectStreamOfOIDsOSIDsOrContextIDs.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/StorageManifestDataElementData.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/space/ObjectSpaceObjectStreamOfContextIDs.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/CompactID.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/HeaderCell.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/property/PrtArrayOfPropertyValues.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/space/ObjectSpaceObjectPropSet.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/RevisionStoreObject.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/util/GuidUtil.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/StorageIndexDataElementData.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/LeafNodeObject.java
* (delete) 
tika-parsers/src/test/resources/test-documents/testOneNoteNonAscii.one
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/unsigned/UByte.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/PropertyType.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/PropertyIDType.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/DataSizeObject.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/ObjectGroupDataElementData.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/util/BitWriter.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/CellManifestDataElementData.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/StorageIndexCellMapping.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/RequestTypes.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/property/PrtFourBytesOfLengthFollowedByData.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/OneNotePropertyId.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/FileNodeListHeader.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/CellID.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/property/ArrayNumber.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/DataElementData.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/FndStructureConstants.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/unsigned/UNumber.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/ExGuid.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/StreamObjectTypeHeaderEnd.java
* (delete) 
tika-parsers/src/test/resources/test-documents/testOneNote2007OrEarlier1.one
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/FileNodeUnion.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/util/DataElementUtils.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/GUID.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/property/EightBytesOfData.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/Revision.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/ObjectGroupObjectDeclare.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/NodeObject.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/FileNodePtr.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/SerialNumber.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/FileDataObject.java
* (add) 
tika-parsers/src/test/resources/test-documents/testOneNoteFromOffice365.one
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/OneNoteDirectFileResource.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/Error.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/ObjectDeclarationWithRefCount.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/OneNoteTreeWalkerOptions.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/ObjectGroupDeclarations.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/DataHashObject.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/property/OneByteOfData.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/unsigned/UMath.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/chunking/RDCAnalysisChunking.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/CompactID.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/Int24.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/JCID.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/basic/PropertyID.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/util/ByteUtil.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/ObjectDeclarationWithRefCountBody.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/space/ObjectSpaceObjectStreamOfOIDs.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/streamobj/ObjectGroupObjectBLOBDataDeclaration.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/MSOneStoreParser.java
* (add) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/fsshttpb/unsigned/Unsigned.java
* (edit) 
tika-parsers/src/main/java/org/apache/tika/parser/microsoft/onenote/OneNoteHeader.java


> OneNote - look into adding support for OneNote 365 documents
> ------------------------------------------------------------
>
>                 Key: TIKA-3446
>                 URL: https://issues.apache.org/jira/browse/TIKA-3446
>             Project: Tika
>          Issue Type: New Feature
>          Components: parser
>    Affects Versions: 1.27
>            Reporter: Nicholas DiPiazza
>            Assignee: Nicholas DiPiazza
>            Priority: Major
>
> While doing some parsing of OneNote documents, I was investigating a slew of 
> them that did not seem to parse very well. 
> When I did some digging, I found out that these documents were generated from 
> SharePoint Online. 
> I had hoped that OneNote documents generated from SharePoint Online would 
> just be the same as on-premises OneNote documents from 2016, 2019, etc. 
> But it turns out this is NOT the case. 
> I checked out the Microsoft specification MS-ONESTORE and found that the 
> documents do not match the specifications that are published. 
> I opened a community post: [Looking for the MS spec for OneNote 365 version - 
> Microsoft 
> Q&A|https://docs.microsoft.com/en-us/answers/questions/436943/looking-for-the-ms-spec-for-onenote-365-version-1.html]
> I also opened an internal ticket with Microsoft. 
> They will be responding soon with an analysis of my issue and we'll see if 
> there is anything we can do. 



--
This message was sent by Atlassian Jira
(v8.20.1#820001)

Reply via email to