URIReader
This commit is contained in:
parent
7f8013fef2
commit
d8fb22a71f
3 changed files with 460 additions and 0 deletions
|
@ -139,6 +139,7 @@ set(libHeaders
|
|||
lib/ebml_socketglue.h
|
||||
lib/websocket.h
|
||||
lib/url.h
|
||||
lib/urireader.h
|
||||
)
|
||||
|
||||
########################################
|
||||
|
@ -183,6 +184,7 @@ add_library (mist
|
|||
lib/ebml_socketglue.cpp
|
||||
lib/websocket.cpp
|
||||
lib/url.cpp
|
||||
lib/urireader.cpp
|
||||
)
|
||||
if (NOT APPLE)
|
||||
set (LIBRT -lrt)
|
||||
|
|
375
lib/urireader.cpp
Normal file
375
lib/urireader.cpp
Normal file
|
@ -0,0 +1,375 @@
|
|||
#include "defines.h"
|
||||
#include "shared_memory.h"
|
||||
#include "timing.h"
|
||||
#include "urireader.h"
|
||||
#include "util.h"
|
||||
#include <sys/mman.h>
|
||||
#include <sys/stat.h>
|
||||
|
||||
namespace HTTP{
|
||||
|
||||
URIReader::URIReader(){
|
||||
char workDir[512];
|
||||
getcwd(workDir, 512);
|
||||
myURI = HTTP::URL(std::string("file://") + workDir);
|
||||
cbProgress = 0;
|
||||
minLen = 1;
|
||||
maxLen = std::string::npos;
|
||||
startPos = 0;
|
||||
supportRangeRequest = false;
|
||||
endPos = std::string::npos;
|
||||
totalSize = std::string::npos;
|
||||
stateType = URIType::Closed;
|
||||
clearPointer = true;
|
||||
}
|
||||
|
||||
URIReader::URIReader(const HTTP::URL &uri){
|
||||
URIReader();
|
||||
open(uri);
|
||||
}
|
||||
|
||||
URIReader::URIReader(const std::string &reluri){
|
||||
URIReader();
|
||||
open(reluri);
|
||||
}
|
||||
|
||||
bool URIReader::open(const std::string &reluri){return open(myURI.link(reluri));}
|
||||
|
||||
/// Internal callback function, used to buffer data.
|
||||
void URIReader::dataCallback(const char *ptr, size_t size){
|
||||
std::string t = std::string(ptr, size);
|
||||
allData.append(t.c_str(), size);
|
||||
}
|
||||
|
||||
bool URIReader::open(const HTTP::URL &uri){
|
||||
myURI = uri;
|
||||
curPos = 0;
|
||||
|
||||
if (!myURI.protocol.size() || myURI.protocol == "file"){
|
||||
if (!myURI.path.size() || myURI.path == "-"){
|
||||
downer.getSocket().open(-1, fileno(stdin));
|
||||
stateType = URIType::Stream;
|
||||
startPos = 0;
|
||||
|
||||
endPos = std::string::npos;
|
||||
totalSize = std::string::npos;
|
||||
if (!downer.getSocket()){
|
||||
FAIL_MSG("Could not open '%s': %s", myURI.getUrl().c_str(), strerror(errno));
|
||||
stateType = URIType::Closed;
|
||||
return false;
|
||||
}
|
||||
return true;
|
||||
}else{
|
||||
//
|
||||
//
|
||||
/// \todo Use ACCESSPERMS instead of 0600?
|
||||
int handle = ::open(myURI.getFilePath().c_str(), O_RDWR, (mode_t)0600);
|
||||
if (handle == -1){
|
||||
FAIL_MSG("opening file: %s failed: %s", myURI.getFilePath().c_str(), strerror(errno));
|
||||
stateType = URIType::Closed;
|
||||
return false;
|
||||
}
|
||||
|
||||
struct stat buffStats;
|
||||
int xRes = fstat(handle, &buffStats);
|
||||
if (xRes < 0){
|
||||
FAIL_MSG("Cheking size of %s failed: %s", myURI.getFilePath().c_str(), strerror(errno));
|
||||
stateType = URIType::Closed;
|
||||
return false;
|
||||
}
|
||||
totalSize = buffStats.st_size;
|
||||
// INFO_MSG("size: %llu", totalSize);
|
||||
|
||||
mapped = (char *)mmap(0, totalSize, PROT_READ | PROT_WRITE, MAP_SHARED, handle, 0);
|
||||
if (mapped == MAP_FAILED){
|
||||
mapped = 0;
|
||||
stateType = URIType::Closed;
|
||||
return false;
|
||||
}
|
||||
startPos = 0;
|
||||
|
||||
stateType = URIType::File;
|
||||
return true;
|
||||
}
|
||||
}
|
||||
|
||||
// HTTP, stream or regular download?
|
||||
if (myURI.protocol == "http" || myURI.protocol == "https"){
|
||||
stateType = URIType::HTTP;
|
||||
|
||||
// Send HEAD request to determine range request is supported, and get total length
|
||||
if (!downer.head(myURI)){FAIL_MSG("Error sending HEAD request");}
|
||||
|
||||
std::string header1 = downer.getHeader("Accept-Ranges");
|
||||
supportRangeRequest = (header1.size() > 0);
|
||||
|
||||
header1 = downer.getHeader("Content-Length");
|
||||
totalSize = atoi(header1.c_str());
|
||||
|
||||
// streaming mode when size is unknown
|
||||
if (!supportRangeRequest){
|
||||
downer.getNonBlocking(uri);
|
||||
}else{
|
||||
MEDIUM_MSG("download file with range request: %s, totalsize: %llu", myURI.getUrl().c_str(), totalSize);
|
||||
if (!downer.getRangeNonBlocking(myURI.getUrl(), curPos, 0)){
|
||||
FAIL_MSG("error loading url: %s", myURI.getUrl().c_str());
|
||||
}
|
||||
}
|
||||
|
||||
if (!downer.getSocket()){
|
||||
FAIL_MSG("Could not open '%s': %s", myURI.getUrl().c_str(), strerror(errno));
|
||||
stateType = URIType::Closed;
|
||||
return false;
|
||||
}
|
||||
return true;
|
||||
}
|
||||
|
||||
FAIL_MSG("URI type not implemented: %s", myURI.getUrl().c_str());
|
||||
return false;
|
||||
}
|
||||
|
||||
// seek to pos, return true if succeeded.
|
||||
bool URIReader::seek(const uint64_t pos){
|
||||
if (isSeekable()){
|
||||
if (stateType == URIType::File){
|
||||
curPos = pos;
|
||||
return true;
|
||||
}else if (stateType == URIType::HTTP && supportRangeRequest){
|
||||
INFO_MSG("SEEK: RangeRequest to %llu", pos);
|
||||
if (!downer.getRangeNonBlocking(myURI.getUrl(), pos, 0)){
|
||||
FAIL_MSG("error loading request");
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
return false;
|
||||
}
|
||||
|
||||
void URIReader::readAll(size_t (*dataCallback)(const char *data, size_t len)){
|
||||
while (!isEOF()){readSome(dataCallback, 419430);}
|
||||
}
|
||||
|
||||
/// Read all function, with use of callbacks
|
||||
void URIReader::readAll(Util::DataCallback &cb){
|
||||
while (!isEOF()){readSome(1048576, cb);}
|
||||
}
|
||||
|
||||
/// Read all blocking function, which internally uses the Nonblocking function.
|
||||
void URIReader::readAll(char *&dataPtr, size_t &dataLen){
|
||||
size_t s = 0;
|
||||
char *tmp = 0;
|
||||
std::string t;
|
||||
|
||||
allData.allocate(68401307);
|
||||
|
||||
while (!isEOF()){
|
||||
readSome(10046, *this);
|
||||
// readSome(1048576, *this);
|
||||
}
|
||||
dataPtr = allData;
|
||||
dataLen = allData.size();
|
||||
}
|
||||
|
||||
void httpBodyCallback(const char *ptr, size_t size){INFO_MSG("callback");}
|
||||
|
||||
void URIReader::readSome(size_t (*dataCallback)(const char *data, size_t len), size_t wantedLen){
|
||||
/// TODO: Implement
|
||||
}
|
||||
|
||||
// readsome with callback
|
||||
void URIReader::readSome(size_t wantedLen, Util::DataCallback &cb){
|
||||
if (isEOF()){return;}
|
||||
if (stateType == URIType::File){
|
||||
// dataPtr = mapped + curPos;
|
||||
uint64_t dataLen = 0;
|
||||
|
||||
if (wantedLen < totalSize){
|
||||
if ((wantedLen + curPos) > totalSize){
|
||||
dataLen = totalSize - curPos; // restant
|
||||
// INFO_MSG("file curpos: %llu, dataLen: %llu, totalSize: %llu ", curPos, dataLen, totalSize);
|
||||
}else{
|
||||
dataLen = wantedLen;
|
||||
}
|
||||
}else{
|
||||
dataLen = totalSize;
|
||||
}
|
||||
|
||||
std::string t = std::string(mapped + curPos, dataLen);
|
||||
cb.dataCallback(t.c_str(), dataLen);
|
||||
|
||||
curPos += dataLen;
|
||||
|
||||
}else if (stateType == URIType::HTTP){
|
||||
|
||||
bool res = downer.continueNonBlocking(cb);
|
||||
|
||||
if (res){
|
||||
if (downer.completed()){
|
||||
MEDIUM_MSG("completed");
|
||||
}else{
|
||||
if (supportRangeRequest){
|
||||
MEDIUM_MSG("do new range request, previous request not completed yet!, curpos: %llu, "
|
||||
"length: %llu",
|
||||
curPos, getSize());
|
||||
}
|
||||
}
|
||||
}else{
|
||||
Util::sleep(10);
|
||||
}
|
||||
}else{// streaming mode
|
||||
int s;
|
||||
static int totaal = 0;
|
||||
if ((downer.getSocket() && downer.getSocket().spool())){// || downer.getSocket().Received().size() > 0){
|
||||
s = downer.getSocket().Received().bytes(wantedLen);
|
||||
std::string buf = downer.getSocket().Received().remove(s);
|
||||
|
||||
cb.dataCallback(buf.data(), s);
|
||||
totaal += s;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
/// Readsome blocking function.
|
||||
void URIReader::readSome(char *&dataPtr, size_t &dataLen, size_t wantedLen){
|
||||
if (stateType == URIType::File){
|
||||
|
||||
dataPtr = mapped + curPos;
|
||||
|
||||
if (wantedLen < totalSize){
|
||||
if ((wantedLen + curPos) > totalSize){
|
||||
dataLen = totalSize - curPos; // restant
|
||||
}else{
|
||||
dataLen = wantedLen;
|
||||
}
|
||||
}else{
|
||||
dataLen = totalSize;
|
||||
}
|
||||
|
||||
curPos += dataLen;
|
||||
}else if (stateType == URIType::HTTP){
|
||||
|
||||
dataLen = downer.data().size();
|
||||
curPos += dataLen;
|
||||
dataPtr = (char *)downer.data().data();
|
||||
}else{
|
||||
if (clearPointer){
|
||||
rPtr.assign(0, 0);
|
||||
clearPointer = false;
|
||||
dataLen = 0;
|
||||
rPtr.allocate(wantedLen);
|
||||
}
|
||||
|
||||
int s;
|
||||
bool run = true;
|
||||
while (downer.getSocket() && run){
|
||||
if (downer.getSocket().spool()){
|
||||
|
||||
if (wantedLen < 8000){
|
||||
s = downer.getSocket().Received().bytes(wantedLen);
|
||||
}else{
|
||||
s = downer.getSocket().Received().bytes(8000);
|
||||
}
|
||||
|
||||
std::string buf = downer.getSocket().Received().remove(s);
|
||||
rPtr.append(buf.c_str(), s);
|
||||
|
||||
dataLen += s;
|
||||
curPos += s;
|
||||
|
||||
if (rPtr.size() >= wantedLen){
|
||||
dataLen = rPtr.size();
|
||||
dataPtr = rPtr;
|
||||
// INFO_MSG("laatste stukje, datalen: %llu, wanted: %llu", dataLen,
|
||||
// wantedLen); dataCallback(ptr, len);
|
||||
clearPointer = true;
|
||||
run = false;
|
||||
}
|
||||
//}
|
||||
}else{
|
||||
// INFO_MSG("data not yet available!");
|
||||
return;
|
||||
}
|
||||
}
|
||||
|
||||
// if (!downer.getSocket()){
|
||||
totalSize = curPos;
|
||||
dataLen = rPtr.size();
|
||||
//}
|
||||
// INFO_MSG("size: %llu, datalen: %llu", totalSize, rPtr.size());
|
||||
dataPtr = rPtr;
|
||||
}
|
||||
}
|
||||
|
||||
void URIReader::close(){
|
||||
if (stateType == URIType::File){
|
||||
if (mapped){
|
||||
munmap(mapped, totalSize);
|
||||
mapped = 0;
|
||||
totalSize = 0;
|
||||
}
|
||||
}else if (stateType == URIType::Stream){
|
||||
downer.getSocket().close();
|
||||
}else if (stateType == URIType::HTTP){
|
||||
downer.getSocket().close();
|
||||
}else{
|
||||
// INFO_MSG("already closed");
|
||||
}
|
||||
}
|
||||
|
||||
void URIReader::onProgress(bool (*progressCallback)(uint8_t)){
|
||||
/// TODO: Implement
|
||||
}
|
||||
|
||||
void URIReader::setBounds(size_t newMinLen, size_t newMaxLen){
|
||||
minLen = newMinLen;
|
||||
maxLen = newMaxLen;
|
||||
}
|
||||
|
||||
bool URIReader::isSeekable(){
|
||||
if (stateType == URIType::HTTP){
|
||||
|
||||
if (supportRangeRequest && totalSize > 0){return true;}
|
||||
}
|
||||
|
||||
return (stateType == URIType::File);
|
||||
}
|
||||
|
||||
bool URIReader::isEOF(){
|
||||
if (stateType == URIType::File){
|
||||
return (curPos >= totalSize);
|
||||
}else if (stateType == URIType::Stream){
|
||||
if (!downer.getSocket()){return true;}
|
||||
|
||||
// if ((totalSize > 0) && (curPos >= totalSize)){return true;}
|
||||
}else if (stateType == URIType::HTTP){
|
||||
// INFO_MSG("iseof, C: %s, seekable: %s", C?"connected":"disconnected", isSeekable()?"yes":"no");
|
||||
if (!downer.getSocket() && !downer.getSocket().Received().available(1) && !isSeekable()){
|
||||
return true;
|
||||
}
|
||||
if ((totalSize > 0) && (curPos >= totalSize)){return true;}
|
||||
|
||||
// mark as complete if downer reports download is completed, or when socket connection is closed when totalsize is not known.
|
||||
if (downer.completed() || (!totalSize && !downer.getSocket())){
|
||||
// INFO_MSG("complete totalsize: %llu, %s", totalSize, downer.getSocket() ? "Connected" : "disconnected");
|
||||
return true;
|
||||
}
|
||||
|
||||
}else{
|
||||
return true;
|
||||
}
|
||||
|
||||
return false;
|
||||
}
|
||||
|
||||
bool URIReader::isGood() const{
|
||||
return true;
|
||||
/// TODO: Implement
|
||||
}
|
||||
|
||||
uint64_t URIReader::getPos(){return curPos;}
|
||||
|
||||
const HTTP::URL &URIReader::getURI() const{return myURI;}
|
||||
|
||||
size_t URIReader::getSize() const{return totalSize;}
|
||||
|
||||
}// namespace HTTP
|
83
lib/urireader.h
Normal file
83
lib/urireader.h
Normal file
|
@ -0,0 +1,83 @@
|
|||
#pragma once
|
||||
#include "downloader.h"
|
||||
#include "util.h"
|
||||
#include <fstream>
|
||||
namespace HTTP{
|
||||
|
||||
enum URIType{Closed = 0, File, Stream, HTTP};
|
||||
|
||||
/// Opens a generic URI for reading. Supports streams/pipes, HTTP(S) and file access.
|
||||
/// Supports seeking, partial and full reads; emulating behaviour where necessary.
|
||||
/// Calls progress callback for long-duration operations, if set.
|
||||
class URIReader : public Util::DataCallback{
|
||||
public:
|
||||
// Setters/initers
|
||||
|
||||
/// Sets the internal URI to the current working directory, but does not call open().
|
||||
URIReader();
|
||||
/// Calls open on the given uri during construction
|
||||
URIReader(const HTTP::URL &uri);
|
||||
/// Calls open on the given relative uri during construction
|
||||
/// URI is resolved relative to the current working directory
|
||||
URIReader(const std::string &reluri);
|
||||
/// Sets the internal URI to the given URI and opens it, whatever that may mean for the given URI type.
|
||||
bool open(const HTTP::URL &uri);
|
||||
/// Links the internal URI to the given relative URI and opens it, whatever that may mean for the current URI type.
|
||||
bool open(const std::string &reluri);
|
||||
/// Seeks to the given position, relative to fragment's #start=X value or 0 if not set.
|
||||
bool seek(const uint64_t pos);
|
||||
/// Reads all data from start to end, calling the dataCallback whenever minLen/maxLen require it.
|
||||
void readAll(size_t (*dataCallback)(const char *data, size_t len));
|
||||
|
||||
/// Reads all data from start to end, returning it in a single buffer with all data.
|
||||
void readAll(char *&dataPtr, size_t &dataLen);
|
||||
/// Reads all data from start to end, using callbacks
|
||||
void readAll(Util::DataCallback &cb);
|
||||
|
||||
/// Reads wantedLen bytes of data from current position, calling the dataCallback whenever minLen/maxLen require it.
|
||||
void readSome(size_t (*dataCallback)(const char *data, size_t len), size_t wantedLen);
|
||||
/// Reads wantedLen bytes of data from current position, returning it in a single buffer.
|
||||
void readSome(char *&dataPtr, size_t &dataLen, size_t wantedLen);
|
||||
|
||||
void readSome(size_t wantedLen, Util::DataCallback &cb);
|
||||
|
||||
/// Closes the currently open URI. Does not change the internal URI value.
|
||||
void close();
|
||||
|
||||
// Configuration setters
|
||||
/// Progress callback, called whenever transfer stalls. Not called if unset.
|
||||
void onProgress(bool (*progressCallback)(uint8_t));
|
||||
/// Sets minimum and maximum buffer size for read calls that use callbacks
|
||||
void setBounds(size_t minLen = 0, size_t maxLen = 0);
|
||||
|
||||
// Static getters
|
||||
bool isSeekable(); /// Returns true if seeking is possible in this URI.
|
||||
bool isEOF(); /// Returns true if the end of the URI has been reached.
|
||||
bool isGood() const; /// Returns true if more data can still be read.
|
||||
uint64_t getPos(); /// Returns the current byte position in the URI.
|
||||
const HTTP::URL &getURI() const; /// Returns the most recently open URI, or the current working directory if not set.
|
||||
size_t getSize() const; /// Returns the size of the currently open URI, if known. Returns std::string::npos if unknown size.
|
||||
|
||||
void (*httpBodyCallback)(const char *ptr, size_t size);
|
||||
void dataCallback(const char *ptr, size_t size);
|
||||
|
||||
private:
|
||||
// Internal state variables
|
||||
bool (*cbProgress)(uint8_t); /// The progress callback, if any. Not called if set to a null pointer.
|
||||
HTTP::URL myURI; /// The most recently open URI, or the current working directory if nothing has been opened yet.
|
||||
size_t minLen; /// Minimum buffer size for dataCallback.
|
||||
size_t maxLen; /// Maximum buffer size for dataCallback.
|
||||
size_t startPos; /// Start position for byte offsets.
|
||||
size_t endPos; /// End position for byte offsets.
|
||||
size_t totalSize; /// Total size in bytes of the current URI. May be incomplete before read finished.
|
||||
size_t curPos;
|
||||
char *mapped;
|
||||
bool supportRangeRequest;
|
||||
Util::ResizeablePointer rPtr;
|
||||
Util::ResizeablePointer allData;
|
||||
bool clearPointer;
|
||||
URIType stateType; /// Holds the type of URI this is, for internal processing purposes.
|
||||
std::ifstream fReader; /// For file-based URIs, the ifstream used for the file.
|
||||
HTTP::Downloader downer; /// For HTTP(S)-based URIs, the Downloader instance used for the download.
|
||||
};
|
||||
}// namespace HTTP
|
Loading…
Add table
Reference in a new issue