fastalgorithms · askhamwhat · Mar 26, 2025 · Oct 29, 2024 · Jan 6, 2025 · Feb 1, 2025
diff --git a/.gitmodules b/.gitmodules
@@ -1,6 +1,6 @@
 [submodule "FLAM"]
 	path = chunkie/FLAM
-	url = https://github.com/klho/FLAM.git
+	url = https://github.com/fastalgorithms/FLAM.git
 
 [submodule "chunkie/fmm2d"]
 	path = chunkie/fmm2d

diff --git a/chunkie/+chnk/+flam/nproxy_square.m b/chunkie/+chnk/+flam/nproxy_square.m
@@ -40,60 +40,53 @@
   srcinfo.d2 = randn(2,nsrc);
   srcinfo.n = [-srcinfo.d(2,:);srcinfo.d(1,:)] ./ sqrt(sum(srcinfo.d.^2,1));
 
-  npxy = 16;
+  stmp = [];
+  stmp.r = randn(2,1); stmp.d = randn(2,1); stmp.d2 = randn(2,1);
+  stmp.n = [-stmp.d(2,:);stmp.d(1,:)] ./ sqrt(sum(stmp.d.^2,1));
 
-				% double until you get enough
-  for i = 1:11
-    [pr,ptau] = chnk.flam.proxy_square_pts(npxy);
-    targinfo.r = pr*width;
+  ttmp = [];
+  ttmp.r = randn(2,1); ttmp.d = randn(2,1); ttmp.d2 = randn(2,1);
+  ttmp.n = [-ttmp.d(2,:);ttmp.d(1,:)] ./ sqrt(sum(ttmp.d.^2,1));
+
+  f = kern(stmp, ttmp);
+  [opdims(1), opdims(2)] = size(f);
+
+  % strengths of random sources
+  sig = randn(opdims(2)*nsrc,1);
+
+  npxy = 64;
+
+  % double until you get enough
+  last_intgrl = NaN;
+  one_more    = true;
+  for i = 0:14
+    [pr,ptau,pw] = chnk.flam.proxy_square_pts(npxy);
+    pwuse =  repmat(pw.', [opdims(1),1]); pwuse = pwuse(:);
+    targinfo.r = width*pr;
     targinfo.d = ptau;
     targinfo.d2 = zeros(2,npxy);
     targinfo.n = [-ptau(2,:);ptau(1,:)] ./ sqrt(sum(ptau.^2,1));
 
-    if npxy > nsrc
-      nsrc = ceil(1.2*npxy);
-      srcinfo = [];
-      srcinfo.r = [-0.5;-0.5]*width + rand(2,nsrc)*width;
-
-      srcinfo.d = randn(2,nsrc);
-      srcinfo.d2 = randn(2,nsrc);
-      srcinfo.n = [-srcinfo.d(2,:);srcinfo.d(1,:)] ./ sqrt(sum(srcinfo.d.^2,1));
-    end
-
-    mat = proxy_square_mat(kern,srcinfo,targinfo);
-
-    [sk,~] = id(mat,rank_or_tol);
-
-    if length(sk) < npxy 
-      npxy = floor((length(sk)-1)/4+1.1)*4;
+    % compute integral along proxy surface of potential from random sources
+    % to see if we've resolved the kernel
+    intgrl = pwuse' * kern(srcinfo,targinfo) * sig;
+
+    % check self convergence
+    err = abs(intgrl - last_intgrl) / abs(intgrl);
+    if err < rank_or_tol || ~one_more
       return;
     end
     npxy = 2*npxy;
-  end
-
-  % npxy is never smaller than nsrc... so no compression is happening... 
-  npxy = -1;
-
-end
-
-function mat = proxy_square_mat(kern,srcinfo,targinfo)
-
-  if numel(kern) == 1
-    mat = kern(srcinfo,targinfo);
-    return;
-  end
+    last_intgrl = intgrl;
 
-  % kern is a cellmat
-
-  [m,n] = size(kern);
-
-  mat = cell(m,n);
-
-  for i=1:m
-    for j=1:n
-      mat{i,j} = kern{i,j}(srcinfo,targinfo);
+    % if using very low tolerance like 1e-14, just get to 1e-12 error
+    % and double one more time to avoid mucking around at machine eps
+    if rank_or_tol < 1e-12 && err < 1e-12
+        one_more = false;
     end
   end
 
-  mat = cell2mat(mat);
-end
+  % kernel was not resolved even with 2^14 points, report failure
+  npxy = -1;
+
+end
diff --git a/chunkie/+chnk/+flam/proxy_square_pts.m b/chunkie/+chnk/+flam/proxy_square_pts.m
@@ -11,7 +11,6 @@
 %   pr - (2,porder) array of proxy point locations (centered at 0 for a 
 %           box of side length 1)
 
-
 if nargin < 1
     porder = 64;
 end
@@ -20,11 +19,10 @@
     opts = [];
 end
 
-iflege = 0;
+iflege = 1;
 if isfield(opts, 'iflege')
     iflege = opts.iflege;
 end
-
 
 assert(mod(porder,4) == 0, ...
     'number of proxy points on square should be multiple of 4')
@@ -33,21 +31,26 @@
 
 if ~iflege
     pts = -1.5+3*(0:(po4-1))*1.0/po4;
+    one = ones(size(pts));
     pw = ones(porder,1)*(4.0*3.0/porder);
 else
-    [xleg, wleg] = lege.exps(po4);
-    pts = xleg.'*1.5;
-    wleg = wleg*1.5;   
-    pw = [wleg; wleg; wleg; wleg];
+    % generate panel Gauss-Legendre rule on [-1.5, 1.5]
+    % because large single-panel rules lose digits
+    k = min(16, po4);
+    npanel = po4/k;
+    [pts, wts] = lege.exps(k);
+    panels = linspace(-1.5, 1.5, npanel + 1);
+    pts = reshape(panels(1:end-1) + 3/(2*npanel) * (pts + 1), 1, []);
+    wts = 3/(2*npanel) * repmat(wts, npanel, 1)';
+    one = ones(1,porder/4);
+    pw = repmat(wts', 4, 1);
 end
 
-one = ones(size(pts));
-
 pr = [pts, one*1.5, -pts, -1.5*one;
-    -1.5*one, pts, 1.5*one, -pts];
+      -1.5*one, pts, 1.5*one, -pts];
 
 ptau = [one, one*0, -one, one*0;
-    one*0, one, one*0, -one];
+        one*0, one, one*0, -one];
 
 pin = @(x) max(abs(x),[],1) < 1.5;
 

diff --git a/chunkie/+chnk/chunkerkerneval_smooth.m b/chunkie/+chnk/chunkerkerneval_smooth.m
@@ -166,10 +166,19 @@
         npxy = chnk.flam.nproxy_square(kerneval,width);
         [pr,ptau,pw,pin] = chnk.flam.proxy_square_pts(npxy);
 
-        pxyfun = @(rc,rx,cx,slf,nbr,l,ctr) chnk.flam.proxyfunr(rc,rx,slf,nbr,l, ...
-            ctr,chnkr,kerneval,opdims,pr,ptau,pw,pin);
+        verb = false; % TODO: make this an option to chunkerkerneval?
+        optsnpxy = []; optsnpxy.rank_or_tol = opts.eps;
+        pxyfun = @(lvl) proxyfunrbylevel(width,lvl,optsnpxy, ...
+            chnkr,kerneval,opdims,verb && opts.proxybylevel);
+        if ~opts.proxybylevel
+            % if not using proxy-by-level, always use pxyfunr from level 1
+            pxyfun = pxyfun(1);
+        end
 
-        optsifmm=[]; optsifmm.Tmax=Inf;
+        optsifmm=[]; 
+        optsifmm.Tmax=Inf; 
+        optsifmm.proxybylevel = opts.proxybylevel;
+        optsifmm.verb = verb;
         F = ifmm(matfun,targinfo_flam.r,xflam1,200,1e-14,pxyfun,optsifmm);
         fints = ifmm_mv(F,dens(:),matfun);
         fints = fints(:);
@@ -224,3 +233,16 @@
 end
 % sum(fints)
 end
+
+function pxyfunrlvl = proxyfunrbylevel(width,lvl,optsnpxy, ...
+    chnkr,kern,opdims,verb ...
+    )
+    npxy = chnk.flam.nproxy_square(kern,width/2^(lvl-1),optsnpxy);
+    [pr,ptau,pw,pin] = chnk.flam.proxy_square_pts(npxy);
+
+    if verb; fprintf('%3d | npxy = %i\n', lvl, npxy); end
+
+    % return the FLAM-style pxyfunr corresponding to lvl
+    pxyfunrlvl = @(rc,rx,cx,slf,nbr,l,ctr) chnk.flam.proxyfunr(rc,rx,slf,nbr,l, ...
+        ctr,chnkr,kern,opdims,pr,ptau,pw,pin);
+end
diff --git a/chunkie/FLAM b/chunkie/FLAM
diff --git a/chunkie/chunkerkerneval.m b/chunkie/chunkerkerneval.m
@@ -27,6 +27,12 @@
 %                   opts.flam supercedes opts.accel, if
 %                   both are true, then flam will be used. (false)
 %       opts.accel - if = true, use specialized fmm if defined 
+%                   for the kernel or use a generic FLAM fmm to accelerate
+%                   the smooth part of the eval. if false do direct. (true)
+%       opts.proxybylevel - if = true, determine the number of
+%                   necessary proxy points adaptively at each level of the 
+%                   factorization in ifmm. Typically needed only for 
+%                   moderate / high frequency problems. (false)
 %                   for the kernel, if it doesnt exist or if too few 
 %                   sources/targets, or if false, 
 %                   do direct. (true)
@@ -112,6 +118,7 @@
 opts_use.forcefmm = false;
 opts_use.fac = 1.0;
 opts_use.eps = 1e-12;
+opts_use.proxybylevel = false;
 cormat = [];
 if isfield(opts,'forcesmooth'); opts_use.forcesmooth = opts.forcesmooth; end
 if isfield(opts,'forceadap'); opts_use.forceadap = opts.forceadap; end
@@ -129,6 +136,7 @@
 if isfield(opts,'accel'); opts_use.accel = opts.accel; end
 if isfield(opts,'fac'); opts_use.fac = opts.fac; end
 if isfield(opts,'eps'); opts_use.eps = opts.eps; end
+if isfield(opts,'proxybylevel'); opts_use.proxybylevel = opts.proxybylevel; end
 
 % Assign appropriate object to targinfo
 targinfo = [];
@@ -466,4 +474,4 @@
 
 end
 
-end
+end
diff --git a/chunkie/fmm2d b/chunkie/fmm2d
diff --git a/devtools/test/flamopdimsTest.m b/devtools/test/flamopdimsTest.m
@@ -176,7 +176,6 @@
     ntot = size(A);
     A = A + eye(ntot);
 else
-
     A = chunkerflam(chnkrs, Kmat, 1, opts_loc); 
 end
+21 −4		ifmm/ifmm.m
+19 −2		rskel/rskel.m
+18 −1		rskelf/rskelf.m
+1 −11		.github/workflows/python.yml
+34 −0		.github/workflows/python_cmake.yml
+180 −0		CMakeLists.txt
+2 −12		docs/conf.py
+156 −1		docs/install.rst
+15 −15		docs/math.rst
+1 −1		docs/requirements.txt
+34 −0		pyproject.toml
+5 −0		python/CMakeLists.txt
+1 −0		python/fmm2dpy/__init__.py
+13 −13		python/fmm2dpy/fmm2d.py
+12 −366		src/biharmonic/bh2dterms.f
+0 −20		src/biharmonic/bhfmm2d.f
+0 −18		src/common/cdjseval2d.f
+1 −14		src/common/hank103.f
+2 −2		src/laplace/lfmm2dwrap.f
+5 −18		src/modified-biharmonic/mbhfmm2d.f
+8 −19		src/modified-biharmonic/mbhrouts2d.f
+0 −11		src/modified-biharmonic/mbhrouts2d.f.j2
+2 −4		src/stokes/stokkernels2d.f
-Original file line number
+Diff line change
@@ Expand Up / @@ -176,7 +176,6 @@ @@
         ntot = size(A);
         A = A + eye(ntot);
     else
         A = chunkerflam(chnkrs, Kmat, 1, opts_loc);
     end
@@ Expand Down @@