Search Text From PDF - Salesforce
PDF Search Text sample in Salesforce demonstrating ‘Search Text From PDF’
PDFTextSearch.cls
/**
 * Sample client for the PDF.co "find" endpoint.
 *
 * Posts a fixed text-search request for a sample PDF and writes the outcome
 * to the debug log. Nothing is returned to the caller.
 */
public class PDFTextSearch {
    // Placeholder value; replace with a real PDF.co API key before running.
    String API_KEY = 'YOUR_PDF_CO_API_KEY_HERE';
    String endPointUrl = 'https://api.pdf.co/v1/pdf/find';

    /**
     * Sends the search request and logs the result.
     *
     * On HTTP 200 the response body is logged. On any other status the body,
     * status text, status code and response string are logged. Any exception
     * raised while building or sending the request is caught and logged with
     * its message, cause and stack trace; it is not rethrown.
     */
    public void searchPdfText() {
        try {
            // Build the payload as a map and let JSON.serialize do the escaping.
            // The regex contains backslashes; a hand-written JSON literal sent
            // them as "\d", which is not a valid JSON escape sequence.
            // Values are kept as strings, exactly as in the original request.
            Map<String, Object> payload = new Map<String, Object>{
                'async' => 'false',
                'encrypt' => 'false',
                'url' => 'https://pdfco-test-files.s3.us-west-2.amazonaws.com/pdf-to-text/sample.pdf',
                'searchString' => 'Invoice Date \\d+/\\d+/\\d+',
                'regexSearch' => 'true',
                'name' => 'output',
                'pages' => '0-',
                'inline' => 'true',
                'wordMatchingMode' => '',
                'password' => ''
            };
            String jsonBody = JSON.serialize(payload);

            HttpRequest request = new HttpRequest();
            request.setMethod('POST');
            request.setEndpoint(endPointUrl);
            request.setHeader('x-api-key', API_KEY);
            request.setHeader('Content-Type', 'application/json');
            request.setBody(jsonBody);

            Http http = new Http();
            HttpResponse response = http.send(request);

            if (response.getStatusCode() == 200) {
                System.debug('PDF Text Search: ' + response.getBody());
            } else {
                System.debug('Error Response ' + response.getBody());
                System.debug(' Status ' + response.getStatus());
                System.debug(' Status Code' + response.getStatusCode());
                System.debug(' Response String' + response.toString());
            }
        } catch (Exception ex) {
            String errorBody = 'Message: ' + ex.getMessage() + ' -- Cause: ' + ex.getCause() + ' -- Stacktrace: ' + ex.getStackTraceString();
            System.debug(errorBody);
        }
    }
}
PDFTextSearchTest.cls
/**
 * Unit test for PDFTextSearch. The HTTP callout is replaced by a mock that
 * returns a canned successful response.
 */
@isTest
private class PDFTextSearchTest {
    /**
     * Runs searchPdfText() against the mock. The method under test returns
     * nothing, so the request it builds is verified inside the mock.
     */
    @isTest
    static void testSearchPdfText() {
        Test.setMock(HttpCalloutMock.class, new PDFTextSearchTest.PDFTextSearchMock());
        // Named differently from the class: Apex identifiers are
        // case-insensitive, so "pdfTextSearch" would collide with the type name.
        PDFTextSearch searcher = new PDFTextSearch();

        Test.startTest();
        searcher.searchPdfText();
        Test.stopTest();
    }

    /**
     * Callout mock that checks the outgoing request and answers with a fixed
     * HTTP 200 JSON body containing one found text item.
     */
    public class PDFTextSearchMock implements HttpCalloutMock {
        public HttpResponse respond(HTTPRequest req) {
            System.assertEquals('POST', req.getMethod(), 'Search request should be sent as POST');
            System.assertEquals('https://api.pdf.co/v1/pdf/find', req.getEndpoint(), 'Search request should target the find endpoint');

            String testBody = '{"success":true,"foundTextItems":[{"text":"Invoice Date 12/04/2019","page":0,"x":30,"y":25,"width":200,"height":15}],"error":false,"status":200}';
            HttpResponse res = new HttpResponse();
            res.setStatusCode(200);
            res.setHeader('Content-Type', 'application/json');
            res.setBody(testBody);
            return res;
        }
    }
}
PDF.co Web API: a Web API with a set of tools for document manipulation, data conversion, data extraction, and splitting and merging of documents. It includes image recognition, built-in OCR, barcode generation, and barcode decoders that read barcodes from scans, pictures, and PDFs.
Download Source Code (.zip)
Return to the previous page | Explore the PDF Search Text endpoint
Copyright © 2016 - 2023 PDF.co