Erlang - 列表解析 - 填充记录

我有一个简单的记录结构：一个标题行（H）对应一到多个数据行（D），即 1:N 的关系。所有标题行都以数字开头，所有数据行都以空白字符开头。其中还可能夹杂一些必须忽略的空行（E）。

L = [H, D, D, E, H, D, E, H, D, D, D].

我想创建一个记录列表：

%% A posting pairs a header row (`header`) with the data belonging to that
%% header (`data`).
-record(posting,{header,data}).

使用列表推导式（list comprehension）。最好的做法是什么？

来源

2010-06-18 tbikeev

你应该做这样的事情：

%% @doc Folds a list of rows into #posting{} records, one record per data row.
%%
%% Row kinds, recognised by their first character:
%%   * header row - starts with a digit ($0..$9); becomes the current header
%%   * data row   - starts with a space; emitted as a posting under the
%%                  current header
%%   * empty row  - `[]'; ignored
%%
%% Returns the postings in reverse input order (they are prepended to the
%% accumulator and not reversed). A data row that appears before any header
%% row, or a row of any other shape, fails with `function_clause'.
make_records(L) when is_list(L) ->
    Step = fun
        %% Data row under a known header: copy the header record, fill in data.
        ([$\s | _] = D, {#posting{} = H, Acc}) ->
            {H, [H#posting{data = D} | Acc]};
        %% Empty row: pass the fold state through unchanged.
        ([], State) ->
            State;
        %% Header row: start a new header template, keep collected postings.
        ([C | _] = H, {_, Acc}) when C >= $0, C =< $9 ->
            {#posting{header = H}, Acc}
    end,
    {_, R} = lists:foldl(Step, {undefined, []}, L),
    R.

不过，我认为直接用普通 Erlang 递归写的版本并不算太复杂，而且应该会更快一些。

%% @doc Builds one #posting{} per data row using plain recursion.
%%
%% Rows starting with a digit are headers, rows starting with a space are data
%% rows, and `[]' rows are skipped. The result is in reverse input order.
make_records2(L) when is_list(L) ->
    make_records2(L, undefined, []).

%% make_records2(Rows, CurrentHeader, Postings)
%% Header row: remember it as the header for the data rows that follow.
make_records2([[Ch | _] = Header | Rest], _Previous, Postings) when $0 =< Ch, Ch =< $9 ->
    make_records2(Rest, Header, Postings);
%% Empty row: nothing to record.
make_records2([[] | Rest], Header, Postings) ->
    make_records2(Rest, Header, Postings);
%% Data row: only valid once a header (a string) has been seen.
make_records2([[$\s | _] = Row | Rest], Header, Postings) when is_list(Header) ->
    Posting = #posting{header = Header, data = Row},
    make_records2(Rest, Header, [Posting | Postings]);
%% Input exhausted: hand back what was collected.
make_records2([], _Header, Postings) ->
    Postings.

编辑：如果需要更完善的行分类或行解析，最好新增一个函数来处理，因为这样可以提高可读性。

%% @doc Classifies a single row.
%%
%% Returns `{header, Row}' when the row starts with a digit, `empty' when the
%% row is empty or consists only of spaces, tabs and newlines, and
%% `{data, Rest}' otherwise, where Rest is the row with that leading
%% whitespace removed.
parse_row([First | _] = Row) when $0 =< First, First =< $9 ->
    {header, Row};
parse_row(Row) ->
    try_spaces(Row).

%% Drops leading whitespace one character at a time; whatever remains is
%% either nothing (`empty') or the data payload.
try_spaces([$\s | Rest]) -> try_spaces(Rest);
try_spaces([$\t | Rest]) -> try_spaces(Rest);
try_spaces([$\n | Rest]) -> try_spaces(Rest);
try_spaces([]) -> empty;
try_spaces(Payload) -> {data, Payload}.

您可以像这样使用它：

%% @doc Folds a list of rows into #posting{} records, one record per data row,
%% classifying each row with parse_row/1.
%%
%% The fold state is `{Current, Acc}': Current is a #posting{} carrying only
%% the most recent header (or `undefined' before the first header) and Acc is
%% the list of completed postings.
%%
%% Returns the postings in reverse input order. A data row that appears before
%% any header row fails with `case_clause'.
make_records(L) when is_list(L) ->
    Step = fun(Row, {Current, Acc} = State) ->
        case parse_row(Row) of
            %% Data row under a known header: copy the header record, fill in data.
            {data, D} when is_record(Current, posting) ->
                {Current, [Current#posting{data = D} | Acc]};
            %% Blank row: keep the whole state, not just the list.
            empty ->
                State;
            %% Header row: bound to a fresh variable so any header matches.
            {header, Header} ->
                {#posting{header = Header}, Acc}
        end
    end,
    {_, R} = lists:foldl(Step, {undefined, []}, L),
    R.

尾递归的原生 Erlang 解决方案：

%% @doc Builds one #posting{} per data row: every row is first classified with
%% parse_row/1, then the classified rows are walked tail-recursively.
%% The result is in reverse input order.
make_records2(L) when is_list(L) ->
    Parsed = [parse_row(Row) || Row <- L],
    make_records2(Parsed, undefined, []).

%% make_records2(ParsedRows, CurrentHeader, Postings)
%% Header: becomes the header for the data rows that follow.
make_records2([{header, Header} | Rest], _Previous, Postings) ->
    make_records2(Rest, Header, Postings);
%% Blank row: skipped.
make_records2([empty | Rest], Header, Postings) ->
    make_records2(Rest, Header, Postings);
%% Data row: only valid once a header (a string) has been seen.
make_records2([{data, Row} | Rest], Header, Postings) when is_list(Header) ->
    Posting = #posting{header = Header, data = Row},
    make_records2(Rest, Header, [Posting | Postings]);
%% Input exhausted.
make_records2([], _Header, Postings) ->
    Postings.

我认为从性能角度来看，没有必要非用尾递归不可：

%% @doc Builds one #posting{} per data row using body recursion, so the result
%% comes out in input order without a final reverse.
%%
%% Rows are classified with parse_row/1. A data row that appears before any
%% header row fails with `case_clause'.
make_records3(L) when is_list(L) ->
    make_records3(L, undefined).

%% make_records3(Rows, CurrentHeader)
make_records3([], _) -> [];
make_records3([R | T], H) ->
    case parse_row(R) of
        %% The record field is `header'; `head' is not a field of #posting{}.
        {data, D} when is_list(H) ->
            [#posting{header = H, data = D} | make_records3(T, H)];
        empty ->
            make_records3(T, H);
        {header, H2} ->
            make_records3(T, H2)
    end.

...以及许多其他变体。

来源

2010-06-18 10:16:04

在这种情况下，您必须使用 lists:foldl/3 而不是列表推导式。借助 foldl/3，您可以在遍历整个列表 L 的过程中累积标题和数据的值。

来源

2010-06-18 07:15:23

我需要把每个标题下的所有数据行合并到一起——所以这是我目前的写法：

%% @doc Normalises a raw row by delegating to trim:trim/1.
%% NOTE(review): `trim' is not an OTP module; presumably it strips surrounding
%% whitespace - confirm against the module actually in use.
sanitize(Row) ->
    trim:trim(Row).

    %% @doc Groups rows into #posting{} records, one record per header row.
    %%
    %% Each posting carries the sanitized header and the list of sanitized data
    %% rows that followed it, both in input order. Rows starting with a digit are
    %% headers, rows starting with a space are data rows, and blank rows (`[]' or
    %% rows starting with a newline) are ignored. A data row that appears before
    %% any header row fails with `function_clause'.
    make_records(L) when is_list(L) -> make_records(L, undefined, []).

    %% make_records(Rows, Pending, Acc)
    %% Pending is `undefined' before the first header, otherwise
    %% `{Header, DataRowsReversed}' for the group being collected.

    %% End of input: the group still being collected must be emitted too,
    %% otherwise the last posting is lost.
    make_records([], Pending, Acc) ->
        lists:reverse(flush_posting(Pending, Acc));

    %% Data row: add it to the group being collected.
    make_records([[$\s | _] = D | T], {Header, Data}, Acc) ->
        make_records(T, {Header, [sanitize(D) | Data]}, Acc);

    %% Blank rows are ignored wherever they appear, including before the
    %% first header.
    make_records([[] | T], Pending, Acc) ->
        make_records(T, Pending, Acc);
    make_records([[$\n | _] | T], Pending, Acc) ->
        make_records(T, Pending, Acc);

    %% Header row: close the previous group (if any) and open a new one.
    make_records([[F | _] = H | T], Pending, Acc) when F >= $0, F =< $9 ->
        make_records(T, {sanitize(H), []}, flush_posting(Pending, Acc)).

    %% Turns the pending group into a posting and prepends it to Acc; a no-op
    %% when no header has been seen yet.
    flush_posting({Header, Data}, Acc) ->
        [#posting{header = Header, data = lists:reverse(Data)} | Acc];
    flush_posting(undefined, Acc) ->
        Acc.

来源

2010-06-20 12:32:14 tbikeev

Erlang - 列表解析 - 填充记录

回答

相关问题