File: jdlink.m

package info (click to toggle)
octave-iso2mesh 1.9.8%2Bds-2
  • links: PTS, VCS
  • area: main
  • in suites: sid, trixie
  • size: 11,128 kB
  • sloc: cpp: 11,982; ansic: 10,158; sh: 365; makefile: 59
file content (115 lines) | stat: -rw-r--r-- 4,049 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
function varargout = jdlink(uripath, varargin)
%
%    data = jdlink(uripath)
%       or
%    [data, fname, cachepath] = jdlink(uripath, 'param1', value1, ...)
%
%    Download linked data files from URLs and store those in cached folders
%
%    author: Qianqian Fang (q.fang <at> neu.edu)
%
%    input:
%        uripath: a single string or a cell array of strings, containing
%                the http:// or https:// links pointing to the linked
%                resources
%        'param'/value pairs: (optional) additional options are supported,
%                including
%            showlink: [1]: print URL or cached file; 0 do not print.
%            showsize: [1]: print the total size of the linked files; 0 do not print.
%            regex: a regular expression that is used to filter the URL
%                 cell array; only those matching the pattern are being
%                 downloaded; this has no effect to a single URL input
%
%    output:
%        data: a cell array storing the parsed data of each linked file
%        fname: a cell array listing the path to each locally cached files
%        cachepath: a cell array listing the cache search path orders
%
%    examples:
%        data = loadjson('https://neurojson.io:7777/openneuro/ds000001');
%        anatfiles = jsonpath(data, '$..anat.._DataLink_');
%        data = jdlink(anatfiles, 'regex', 'sub-0[12].*\.nii');
%        jsonpath(data, '$..Dim')
%
%    license:
%        BSD or GPL version 3, see LICENSE_{BSD,GPLv3}.txt files for details
%
% -- this function is part of JSONLab toolbox (http://iso2mesh.sf.net/cgi-bin/index.cgi?jsonlab)
%

opt = varargin2struct(varargin{:});
opt.showlink = jsonopt('showlink', 1, opt);
opt.showsize = jsonopt('showsize', 1, opt);

if (iscell(uripath))
    if (isfield(opt, 'regex'))
        haspattern = cellfun(@(x) isempty(regexp(x, opt.regex, 'once')), uripath);
        uripath(haspattern) = [];
    end
    if (isfield(opt, 'showsize'))
        totalsize = 0;
        nosize = 0;
        for i = 1:length(uripath)
            filesize = regexp(uripath{i}, '&size=(\d+)', 'tokens');
            if (~isempty(filesize) && ~isempty(filesize{1}))
                totalsize = totalsize + str2double(filesize{1});
            else
                nosize = nosize + 1;
            end
        end
        fprintf('total %d links, %.0f bytes, %d files with unknown size\n', length(uripath), totalsize, nosize);
    end
    alloutput = cell(1, nargout);
    for i = 1:length(uripath)
        [newdata, fname, cachepath] = downloadlink(uripath{i}, opt);
        if (nargout > 0)
            alloutput{1}{end + 1} = newdata;
            if (nargout > 1)
                alloutput{2}{end + 1} = fname;
                if (nargout > 2)
                    alloutput{3}{end + 1} = cachepath;
                end
            end
        end
    end
    if (length(uripath) == 1)
        alloutput = cellfun(@(x) x{1}, alloutput, 'UniformOutput', false);
    end
    varargout = alloutput;
elseif (ischar(uripath) || isa(uripath, 'string'))
    [varargout{1:nargout}] = downloadlink(uripath, opt);
end

%%
function [newdata, fname, cachepath] = downloadlink(uripath, opt)
newdata = [];
[cachepath, filename] = jsoncache(uripath);
if (iscell(cachepath) && ~isempty(cachepath))
    if (opt.showlink)
        fprintf(1, 'downloading from URL: %s\n', uripath);
    end

    fname = [cachepath{1} filesep filename];
    fpath = fileparts(fname);
    if (~exist(fpath, 'dir'))
        mkdir(fpath);
    end
    if (exist('websave'))
        websave(fname, uripath);
    else
        rawdata = urlread(uripath);
        fid = fopen(fname, 'wb');
        if (fid == 0)
            error('can not save URL to cache at path %s', fname);
        end
        fwrite(fid, uint8(rawdata));
        fclose(fid);
    end
    newdata = loadjd(fname, opt);
elseif (~iscell(cachepath) && exist(cachepath, 'file'))
    if (opt.showlink)
        fprintf(1, 'loading from cache: %s\n', cachepath);
    end
    fname = cachepath;
    newdata = loadjd(fname, opt);
end