-
Notifications
You must be signed in to change notification settings - Fork 1.3k
Add MicrosoftOfficeFilesParser independent publisher connector by Steven Soe #3936
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
base: dev
Are you sure you want to change the base?
Changes from all commits
69a4cc0
e3507c3
95d49ed
095500f
fde4abe
ed75c5d
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,43 @@ | ||
# MicrosoftOffice Files Parser Connector | ||
|
||
Custom connector for parsing Microsoft Word and Excel documents by submitting base64-encoded file content. Designed for use with Power Automate, Power Apps, and Azure Logic Apps to enable easy document content extraction. | ||
|
||
## Publisher: Steven Soe | ||
Certified Connector Owner | ||
|
||
## Prerequisites | ||
No special licenses or plans are required. The connector does **not** require authentication. Suitable for users with access to Power Automate, Power Apps, or Azure Logic Apps. | ||
|
||
## Supported Operations | ||
|
||
### Parse Word Document | ||
Accepts base64-encoded Word document content and returns the extracted text content. | ||
|
||
### Parse Excel Spreadsheet | ||
Accepts base64-encoded Excel file content and returns worksheet names along with the parsed worksheet data as 2D arrays. | ||
|
||
## Obtaining Credentials | ||
This connector does **not** require authentication or credentials. | ||
|
||
## Getting Started | ||
To use the connector, POST a JSON payload containing the `$content-type` and `base64$content` properties to the respective endpoint for Word or Excel parsing. For Excel, also include `$filename` with the file extension. | ||
|
||
## Known Issues and Limitations | ||
- The connector expects base64 encoding for the file content. | ||
- The `$filename` parameter is required for Excel files and must include the file extension. | ||
- The connector does **not** store, retain, or use any submitted data. | ||
- No authentication is required; users should exercise caution when sharing sensitive data through flows using this connector. | ||
|
||
## Frequently Asked Questions | ||
|
||
### Does this connector store my data? | ||
No, the connector does not store, retain, or use any submitted file content. | ||
|
||
### Is authentication required? | ||
No, this connector does not require any authentication. | ||
|
||
## Deployment Instructions | ||
Place the connector files (`swagger.yaml`, `manifest.json`, `README.md`, `icon.png`) in your folder structure and import the custom connector into your Power Platform environment via the Power Automate or Power Apps portal. | ||
|
||
## Support | ||
For questions or support, contact [[email protected]](mailto:[email protected]). |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,167 @@ | ||
{ | ||
"swagger": "2.0", | ||
"info": { | ||
"version": "1.0", | ||
"title": "MicrosoftOffice Files Parser", | ||
"description": "Custom connector for parsing Word and Excel documents.", | ||
"contact": { | ||
"name": "Steven Soe", | ||
"url": "https://github.com/ssdevkit", | ||
"email": "[email protected]" | ||
} | ||
}, | ||
"host": "ssnotes.azurewebsites.net", | ||
"basePath": "/", | ||
"schemes": [ | ||
"https" | ||
], | ||
"consumes": [ | ||
"application/json" | ||
], | ||
"produces": [ | ||
"application/json" | ||
], | ||
"paths": { | ||
"/apps/parser/word.php": { | ||
"post": { | ||
"summary": "Parse Word Document", | ||
"description": "Parses a Word document from base64 content.", | ||
"operationId": "Word_Document", | ||
"parameters": [ | ||
{ | ||
"name": "body", | ||
"in": "body", | ||
"required": true, | ||
"schema": { | ||
"type": "object", | ||
"properties": { | ||
"$content-type": { | ||
"type": "string", | ||
"description": "Content-Type of the document" | ||
}, | ||
"base64$content": { | ||
"type": "string", | ||
"description": "Base64 encoded Word document content" | ||
} | ||
}, | ||
"required": [ | ||
"$content-type", | ||
"base64$content" | ||
] | ||
} | ||
} | ||
], | ||
"responses": { | ||
"200": { | ||
"description": "Text extracted successfully", | ||
"schema": { | ||
"type": "object", | ||
"properties": { | ||
"message": { | ||
"type": "string", | ||
"example": "Text extracted successfully", | ||
"description": "Result message from the API" | ||
}, | ||
"text": { | ||
"type": "string", | ||
"example": "Cloud", | ||
"description": "Extracted text content" | ||
} | ||
}, | ||
"required": [ | ||
"message", | ||
"text" | ||
] | ||
} | ||
} | ||
} | ||
} | ||
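}, | ||
"/apps/parser/excel.php": { | ||
"post": { | ||
"summary": "Parse Excel Spreadsheet", | ||
"description": "Parses an Excel spreadsheet from base64 content and returns the worksheet names with each worksheet's data as a 2D array.", | ||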
"operationId": "Excel_Spreadsheet", | ||
"parameters": [ | ||
{ | ||
"name": "body", | ||
"in": "body", | ||
"required": true, | ||
"schema": { | ||
"type": "object", | ||
"properties": { | ||
"$content-type": { | ||
"type": "string", | ||
"description": "Content-Type of the spreadsheet" | ||
}, | ||
"$filename": { | ||
"type": "string", | ||
"description": "Filename of the spreadsheet, including the file extension" | ||
}, | ||
"base64$content": { | ||
"type": "string", | ||
"description": "Base64 encoded Excel file content" | ||
} | ||
}, | ||
"required": [ | ||
"base64$content", | ||
"$content-type", | ||
"$filename" | ||
] | ||
} | ||
} | ||
], | ||
"responses": { | ||
"200": { | ||
"description": "Excel parsing response containing worksheet data in arrays", | ||
"schema": { | ||
"type": "object", | ||
"properties": { | ||
"Worksheets": { | ||
"type": "array", | ||
"description": "List of all sheet names in the response", | ||
"items": { | ||
"type": "string" | ||
} | ||
} | ||
}, | ||
"required": [ | ||
"Worksheets" | ||
], | ||
"additionalProperties": { | ||
"type": "array", | ||
"description": "2D array of strings representing sheet data rows and columns", | ||
"items": { | ||
"type": "array", | ||
"items": { | ||
"type": "string" | ||
} | ||
} | ||
} | ||
} | ||
} | ||
} | ||
} | ||
} | ||
}, | ||
"definitions": {}, | ||
"parameters": {}, | ||
"responses": {}, | ||
"securityDefinitions": {}, | ||
"security": [], | ||
"tags": [], | ||
"x-ms-connector-metadata": [ | ||
{ | ||
"propertyName": "Website", | ||
"propertyValue": "https://github.com/ssdevkit/Microsoft-PowerPlatform-Connector/tree/main/MicrosoftOffice%20Files%20Parser" | ||
}, | ||
{ | ||
"propertyName": "Privacy policy", | ||
"propertyValue": "https://raw.githubusercontent.com/ssdevkit/Microsoft-PowerPlatform-Connector/main/MicrosoftOffice%20Files%20Parser/privacy.md" | ||
}, | ||
{ | ||
"propertyName": "Categories", | ||
"propertyValue": "Content and Files;Productivity" | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Please fix the below error: ##[error]The connector category is invalid. Available categories are: [AI, Business Management, Business Intelligence, Collaboration, Commerce, Communication, Content and Files, Finance, Data, Human Resources, Internet of Things, IT Operations, Lifestyle and Entertainment, Marketing, Productivity, Sales and CRM, Security, Social Media, Website]. ValuePath: /x-ms-connector-metadata/2/propertyValue |
||
} | ||
] | ||
} |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,9 @@ | ||
{ | ||
"properties": { | ||
"connectionParameters": {}, | ||
"iconBrandColor": "#0078D4", | ||
"capabilities": [], | ||
"publisher": "Steven Soe", | ||
"stackOwner": "Steven Soe" | ||
} | ||
} |
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Please remove reserved word "Microsoft".