github.com/keybase/client/go@v0.0.0-20240309051027-028f7c731f8b/chat/unfurl/extractor_test.go (about)

     1  package unfurl
     2  
     3  import (
     4  	"context"
     5  	"fmt"
     6  	"testing"
     7  
     8  	"github.com/keybase/client/go/chat/globals"
     9  	"github.com/keybase/client/go/externalstest"
    10  	"github.com/keybase/client/go/protocol/chat1"
    11  	"github.com/keybase/client/go/protocol/gregor1"
    12  	"github.com/stretchr/testify/require"
    13  )
    14  
    15  const codeBlock = "```"
    16  
    17  func TestExtractor(t *testing.T) {
    18  	tc := externalstest.SetupTest(t, "chat_extractor", 1)
    19  	defer tc.Cleanup()
    20  	g := globals.NewContext(tc.G, &globals.ChatContext{})
    21  
    22  	uid := gregor1.UID([]byte{0, 1})
    23  	convID := chat1.ConversationID([]byte{0, 1})
    24  	settingsMod := NewSettings(g, newMemConversationBackedStorage())
    25  	extractor := NewExtractor(g)
    26  	type testCase struct {
    27  		message   string
    28  		mode      chat1.UnfurlMode
    29  		whitelist []string
    30  		result    []ExtractorHit
    31  	}
    32  	var maxCase string
    33  	var maxRes []ExtractorHit
    34  	for i := 0; i < extractor.maxHits+5; i++ {
    35  		maxCase += " http://www.wsj.com"
    36  	}
    37  	for i := 0; i < extractor.maxHits; i++ {
    38  		maxRes = append(maxRes, ExtractorHit{
    39  			URL: "http://www.wsj.com",
    40  			Typ: ExtractorHitUnfurl,
    41  		})
    42  	}
    43  	cases := []testCase{
    44  		{
    45  			message: "check out this lame post: http://www.twitter.com/mike/383878473873",
    46  			mode:    chat1.UnfurlMode_NEVER,
    47  		},
    48  		{
    49  			message: "check out this lame site: www.google.com",
    50  			mode:    chat1.UnfurlMode_ALWAYS,
    51  		},
    52  		{
    53  			message: maxCase,
    54  			mode:    chat1.UnfurlMode_ALWAYS,
    55  			result:  maxRes,
    56  		},
    57  		{
    58  			message: "check out this lame post: http://www.twitter.com/mike/383878473873",
    59  			mode:    chat1.UnfurlMode_ALWAYS,
    60  			result: []ExtractorHit{
    61  				{
    62  					URL: "http://www.twitter.com/mike/383878473873",
    63  					Typ: ExtractorHitUnfurl,
    64  				},
    65  			},
    66  		},
    67  		{
    68  			message: "check out this lame post: `http://www.twitter.com/mike/383878473873`",
    69  			mode:    chat1.UnfurlMode_ALWAYS,
    70  			result:  nil,
    71  		},
    72  		{
    73  			message: fmt.Sprintf(`%s
    74  			[mike@lisa-keybase]-[~/go/src/github.com/keybase/client/go] (mike/markdown)$ scraper https://www.wsj.com/articles/a-silicon-valley-tech-leader-walks-a-high-wire-between-the-u-s-and-china-1542650707?mod=hp_lead_pos4
    75  			2018/11/19 16:33:52 ++Chat: + Scraper: Scrape
    76  			2018/11/19 16:33:53 ++Chat: | Scraper: scrapeGeneric: pubdate: 2018-11-19T18:05:00.000Z
    77  			2018/11/19 16:33:53 ++Chat: | Scraper: scrapeGeneric: success: 1542650700
    78  			2018/11/19 16:33:53 ++Chat: - Scraper: Scrape -> ok [time=893.809968ms]
    79  			Title: A Silicon Valley Tech Leader Walks a High Wire Between the U.S. and China
    80  			Url: https://www.wsj.com/articles/a-silicon-valley-tech-leader-walks-a-high-wire-between-the-u-s-and-china-1542650707
    81  			SiteName: WSJ
    82  			PublishTime: 2018-11-19 13:05:00 -0500 EST
    83  			Description: Nvidia sells lots of artificial-intelligence chips in China. That creates a dilemma as the company tries to navigate political and trade tensions.
    84  			ImageUrl: https://images.wsj.net/im-37707/social,
    85  			FaviconUrl: https://s.wsj.net/media/wsj_apple-touch-icon-180x180.png
    86  			%s`, codeBlock, codeBlock),
    87  			mode:   chat1.UnfurlMode_ALWAYS,
    88  			result: nil,
    89  		},
    90  		{
    91  			message: "check out this lame post: `http://www.twitter.com/mike/383878473873` http://www.twitter.com/mike/MIKE",
    92  			mode:    chat1.UnfurlMode_ALWAYS,
    93  			result: []ExtractorHit{
    94  				{
    95  					URL: "http://www.twitter.com/mike/MIKE",
    96  					Typ: ExtractorHitUnfurl,
    97  				},
    98  			},
    99  		},
   100  		{
   101  			message: "check out this lame post: ```http://www.twitter.com/mike/383878473873````",
   102  			mode:    chat1.UnfurlMode_ALWAYS,
   103  			result:  nil,
   104  		},
   105  		{
   106  			message: "check out this lame post: http://www.twitter.com/mike/383878473873",
   107  			mode:    chat1.UnfurlMode_WHITELISTED,
   108  			result: []ExtractorHit{
   109  				{
   110  					URL: "http://www.twitter.com/mike/383878473873",
   111  					Typ: ExtractorHitPrompt,
   112  				},
   113  			},
   114  		},
   115  		{
   116  			message:   "check out this lame post: http://www.twitter.com/mike/383878473873",
   117  			mode:      chat1.UnfurlMode_WHITELISTED,
   118  			whitelist: []string{"twitter.com"},
   119  			result: []ExtractorHit{
   120  				{
   121  					URL: "http://www.twitter.com/mike/383878473873",
   122  					Typ: ExtractorHitUnfurl,
   123  				},
   124  			},
   125  		},
   126  		{
   127  			message:   "http://www.github.com/keybase/client check out this lame post: http://www.twitter.com/mike/383878473873",
   128  			mode:      chat1.UnfurlMode_WHITELISTED,
   129  			whitelist: []string{"twitter.com", "github.com"},
   130  			result: []ExtractorHit{
   131  				{
   132  					URL: "http://www.github.com/keybase/client",
   133  					Typ: ExtractorHitUnfurl,
   134  				},
   135  				{
   136  					URL: "http://www.twitter.com/mike/383878473873",
   137  					Typ: ExtractorHitUnfurl,
   138  				},
   139  			},
   140  		},
   141  	}
   142  	for _, tcase := range cases {
   143  		settings := chat1.NewUnfurlSettings()
   144  		settings.Mode = tcase.mode
   145  		for _, w := range tcase.whitelist {
   146  			settings.Whitelist[w] = true
   147  		}
   148  		require.NoError(t, settingsMod.Set(context.TODO(), uid, settings))
   149  		res, err := extractor.Extract(context.TODO(), uid, convID, 1, tcase.message, settingsMod)
   150  		require.NoError(t, err)
   151  		require.Equal(t, tcase.result, res)
   152  	}
   153  }
   154  
   155  func TestExtractorExemptions(t *testing.T) {
   156  	tc := externalstest.SetupTest(t, "chat_extractor", 1)
   157  	defer tc.Cleanup()
   158  	g := globals.NewContext(tc.G, &globals.ChatContext{})
   159  
   160  	uid := gregor1.UID([]byte{0, 1})
   161  	convID := chat1.ConversationID([]byte{0, 1})
   162  	msgID := chat1.MessageID(1)
   163  	extractor := NewExtractor(g)
   164  	settings := chat1.NewUnfurlSettings()
   165  	settings.Mode = chat1.UnfurlMode_WHITELISTED
   166  	settings.Whitelist["amazon.com"] = true
   167  	settingsMod := NewSettings(g, newMemConversationBackedStorage())
   168  
   169  	extractor.AddWhitelistExemption(context.TODO(), uid,
   170  		NewOneTimeWhitelistExemption(convID, msgID, "amazon.com"))
   171  	res, err := extractor.Extract(context.TODO(), uid, convID, msgID, "http://amazon.com", settingsMod)
   172  	require.NoError(t, err)
   173  	require.Equal(t, 1, len(res))
   174  	require.Equal(t, ExtractorHitUnfurl, res[0].Typ)
   175  	extractor.AddWhitelistExemption(context.TODO(), uid,
   176  		NewOneTimeWhitelistExemption(convID, msgID, "cnn.com"))
   177  	res, err = extractor.Extract(context.TODO(), uid, convID, msgID, "http://amazon.com", settingsMod)
   178  	require.NoError(t, err)
   179  	require.Equal(t, 1, len(res))
   180  	require.Equal(t, ExtractorHitPrompt, res[0].Typ)
   181  	res, err = extractor.Extract(context.TODO(), uid, convID, msgID, "http://cnn.com", settingsMod)
   182  	require.NoError(t, err)
   183  	require.Equal(t, 1, len(res))
   184  	require.Equal(t, ExtractorHitUnfurl, res[0].Typ)
   185  	res, err = extractor.Extract(context.TODO(), uid, convID, msgID, "http://cnn.com", settingsMod)
   186  	require.NoError(t, err)
   187  	require.Equal(t, 1, len(res))
   188  	require.Equal(t, ExtractorHitPrompt, res[0].Typ)
   189  
   190  	res, err = extractor.Extract(context.TODO(), uid, convID, msgID, "http://google.com", settingsMod)
   191  	require.NoError(t, err)
   192  	require.Equal(t, 1, len(res))
   193  	require.Equal(t, ExtractorHitPrompt, res[0].Typ)
   194  	extractor.AddWhitelistExemption(context.TODO(), uid,
   195  		NewSingleMessageWhitelistExemption(convID, msgID, "google.com"))
   196  	res, err = extractor.Extract(context.TODO(), uid, convID, msgID, "http://google.com", settingsMod)
   197  	require.NoError(t, err)
   198  	require.Equal(t, 1, len(res))
   199  	require.Equal(t, ExtractorHitUnfurl, res[0].Typ)
   200  	res, err = extractor.Extract(context.TODO(), uid, convID, msgID, "http://google.com", settingsMod)
   201  	require.NoError(t, err)
   202  	require.Equal(t, 1, len(res))
   203  	require.Equal(t, ExtractorHitUnfurl, res[0].Typ)
   204  
   205  	require.NoError(t, settingsMod.Set(context.TODO(), uid, settings))
   206  	res, err = extractor.Extract(context.TODO(), uid, convID, msgID, "http://amazon.com", settingsMod)
   207  	require.NoError(t, err)
   208  	require.Equal(t, 1, len(res))
   209  	require.Equal(t, ExtractorHitUnfurl, res[0].Typ)
   210  }