From 233d1cc2eb70514a4005cd869b6ad478b7440b73 Mon Sep 17 00:00:00 2001
From: Matthew Craig <mattwcraig@gmail.com>
Date: Fri, 26 Jul 2019 13:15:15 -0400
Subject: [PATCH 01/10] Remove info_file option from ImageFileCollection

Fixes #679 by removing the ability to initialize from a table.
---
 ccdproc/image_collection.py            | 47 +-----------
 ccdproc/tests/test_image_collection.py | 98 --------------------------
 2 files changed, 3 insertions(+), 142 deletions(-)

diff --git a/ccdproc/image_collection.py b/ccdproc/image_collection.py
index 500ad573..5d0aa509 100644
--- a/ccdproc/image_collection.py
+++ b/ccdproc/image_collection.py
@@ -48,15 +48,6 @@ class ImageFileCollection(object):
         columns. Default value is '*' unless ``info_file`` is specified.
         Default is ``None``.
 
-    info_file : str or None, optional
-        Path to file that contains a table of information about FITS files.
-        In this case the keywords are set to the names of the columns of the
-        ``info_file`` unless ``keywords`` is explicitly set to a different
-        list.
-        Default is ``None``.
-
-        .. deprecated:: 1.3
-
     filenames: str, list of str, or None, optional
         List of the names of FITS files which will be added to the collection.
         The filenames are assumed to be in ``location``.
@@ -84,13 +75,8 @@ class ImageFileCollection(object):
         Raised if keywords are set to a combination of '*' and any other
         value.
     """
-    def __init__(self, location=None, keywords=None, info_file=None,
+    def __init__(self, location=None, keywords=None,
                  filenames=None, glob_include=None, glob_exclude=None, ext=0):
-
-        if info_file is not None:
-            warnings.warn("The 'info_file' argument is deprecated and will be "
-                          "removed in a future version", DeprecationWarning)
-
         # Include or exclude files from the collection based on glob pattern
         # matching - has to go above call to _get_files()
         if glob_exclude is not None:
@@ -104,7 +90,6 @@ def __init__(self, location=None, keywords=None, info_file=None,
         self._location = location
         self._filenames = filenames
         self._files = []
-        self._info_file = info_file
         if location:
             self._files = self._get_files()
 
@@ -113,29 +98,8 @@ def __init__(self, location=None, keywords=None, info_file=None,
                           AstropyUserWarning)
         self._summary = {}
         if keywords is None:
-            if info_file is not None:
-                # Default to empty list so that keywords will be populated
-                # from table columns names.
-                keywords = []
-            else:
-                # Otherwise use all keywords.
-                keywords = '*'
-        if info_file is not None:
-            try:
-                info_path = path.join(self.location, info_file)
-            except (AttributeError, TypeError):
-                info_path = info_file
-            try:
-                self._summary = Table.read(info_path, format='ascii',
-                                           delimiter=',')
-                self._summary = Table(self._summary, masked=True)
-            except IOError:
-                if location:
-                    logger.warning('unable to open table file %s, will try '
-                                   'initializing from location instead.',
-                                   info_path)
-                else:
-                    raise
+            # Use all keywords.
+            keywords = '*'
 
         # Used internally to keep track of whether the user asked for all
         # keywords or a specific list. The keywords setter takes care of
@@ -159,11 +123,6 @@ def __repr__(self):
         else:
             kw = "keywords={!r}".format(self.keywords[1:])
 
-        if self._info_file is None:
-            infofile = ''
-        else:
-            infofile = "info_file={!r}".format(self._info_file)
-
         if self.glob_exclude is None:
             glob_exclude = ''
         else:
diff --git a/ccdproc/tests/test_image_collection.py b/ccdproc/tests/test_image_collection.py
index 07aaa0f5..ce31a559 100644
--- a/ccdproc/tests/test_image_collection.py
+++ b/ccdproc/tests/test_image_collection.py
@@ -92,24 +92,6 @@ def test_repr_ext(self, triage_setup):
                .format(triage_setup.test_dir))
         assert repr(ic) == ref
 
-    def test_repr_info(self, triage_setup):
-        summary_file_path = os.path.join(triage_setup.test_dir, 'info.csv')
-        ic = ImageFileCollection(
-            location=triage_setup.test_dir, keywords=['naxis'])
-        ic.summary.write(summary_file_path)
-        with catch_warnings() as w:
-            ic2 = ImageFileCollection(info_file=summary_file_path)
-        # ImageFileCollections from info_files contain no files. That issues
-        # a Warning that we'll ignore here.
-        assert len(w) == 2
-        assert "'info_file' argument is deprecated" in str(w[0].message)
-        assert 'no FITS files in the collection' in str(w[1].message)
-
-        ref = ("ImageFileCollection(keywords=['naxis'], info_file={0!r})"
-               .format(summary_file_path))
-        assert repr(ic2) == ref
-
-
 # This should work mark all test methods as using the triage_setup
 # fixture, but it doesn't, so the fixture is given explicitly as an
 # argument to each method.
@@ -586,86 +568,6 @@ def test_setting_write_location_to_bad_dest_raises_error(self, tmpdir,
             for hdr in ic.headers(save_location=bad_directory.strpath):
                 pass
 
-    def test_initializing_from_table(self, triage_setup):
-        keys = ['imagetyp', 'filter']
-        ic = ImageFileCollection(triage_setup.test_dir, keywords=keys)
-        table = ic.summary
-        table_path = os.path.join(triage_setup.test_dir, 'input_tbl.csv')
-        nonsense = 'forks'
-        table['imagetyp'][0] = nonsense
-        table.write(table_path, format='ascii', delimiter=',')
-        with catch_warnings() as w:
-            ic = ImageFileCollection(location=None, info_file=table_path)
-        # By using location=None we don't have actual files in the collection.
-        assert len(w) == 2
-        assert "'info_file' argument is deprecated" in str(w[0].message)
-        assert str(w[1].message) == "no FITS files in the collection."
-
-        # keywords can only have been set from saved table
-        for key in keys:
-            assert key in ic.keywords
-        # no location, so should be no files
-        assert len(ic.files) == 0
-        # no location, so no way to iterate over files
-        with pytest.raises((AttributeError, TypeError)):
-            for h in ic.headers():
-                pass
-        with catch_warnings() as w:
-            ic = ImageFileCollection(location=triage_setup.test_dir,
-                                     info_file=table_path)
-        assert len(w) == 1
-        assert "'info_file' argument is deprecated" in str(w[0].message)
-        # we now have a location, so did we get files?
-        assert len(ic.files) == len(table)
-        # Is the summary table masked?
-        assert ic.summary.masked
-        # can I loop over headers?
-        for h in ic.headers():
-            assert isinstance(h, fits.Header)
-        # Does ImageFileCollection summary contain values from table?
-        assert nonsense in ic.summary['imagetyp']
-
-    def test_initializing_from_table_file_that_does_not_exist(
-            self, triage_setup, tmpdir):
-        log = tmpdir.join('tmp.log')
-
-        self._setup_logger(log.strpath)
-
-        # Do we get a warning if we try reading a file that doesn't exist,
-        # but where we can initialize from a directory?
-        with catch_warnings() as w:
-            ic = ImageFileCollection(
-                location=triage_setup.test_dir,
-                info_file='iufadsdhfasdifre')
-        assert len(w) == 1
-        assert "'info_file' argument is deprecated" in str(w[0].message)
-
-        with open(log.strpath) as f:
-            warnings = f.readlines()
-
-        assert (len(warnings) == 1)
-        is_in = ['unable to open table file' in w for w in warnings]
-        assert all(is_in)
-        # Do we raise an error if the table name is bad AND the location
-        # is None?
-        with pytest.raises(IOError):
-            # Because the location is None we get a Warning about "no files in
-            # the collection".
-            with catch_warnings() as w:
-                ImageFileCollection(location=None, info_file='iufadsdhfasdifre')
-        assert len(w) == 2
-        assert "'info_file' argument is deprecated" in str(w[0].message)
-        assert str(w[1].message) == "no FITS files in the collection."
-
-        # Do we raise an error if the table name is bad AND
-        # the location is given but is bad?
-        with pytest.raises(OSError):
-            with catch_warnings() as w:
-                ic = ImageFileCollection(location='dasifjoaurun',
-                                         info_file='iufadsdhfasdifre')
-        assert len(w) == 1
-        assert "'info_file' argument is deprecated" in str(w[0].message)
-
     def test_no_fits_files_in_collection(self):
         with catch_warnings(AstropyUserWarning) as warning_lines:
             # FIXME: What exactly does this assert?

From 3073c56b5597c04794dfbf9b54160ac563656e6d Mon Sep 17 00:00:00 2001
From: Matthew Craig <mattwcraig@gmail.com>
Date: Fri, 26 Jul 2019 13:18:59 -0400
Subject: [PATCH 02/10] Allow collections set up from a list of files with no
 location

Fixes #374 and Fixes #661
Main change is how we handle a location of None.
---
 ccdproc/image_collection.py            | 22 ++++++--
 ccdproc/tests/test_image_collection.py | 76 +++++++++++++++++++++++++-
 2 files changed, 91 insertions(+), 7 deletions(-)

diff --git a/ccdproc/image_collection.py b/ccdproc/image_collection.py
index 5d0aa509..9754b601 100644
--- a/ccdproc/image_collection.py
+++ b/ccdproc/image_collection.py
@@ -87,11 +87,14 @@ def __init__(self, location=None, keywords=None,
             glob_include = str(glob_include)
         self._glob_include = glob_include
 
-        self._location = location
+        if location is not None:
+            self._location = location
+        else:
+            self._location = ''
+
         self._filenames = filenames
         self._files = []
-        if location:
-            self._files = self._get_files()
+        self._files = self._get_files()
 
         if self._files == []:
             warnings.warn("no FITS files in the collection.",
@@ -143,7 +146,7 @@ def __repr__(self):
         else:
             filenames = "filenames={}".format(self._filenames)
 
-        params = [location, kw, infofile, filenames, glob_include, glob_exclude, ext]
+        params = [location, kw, filenames, glob_include, glob_exclude, ext]
         params = ', '.join([p for p in params if p])
 
         str_repr = "{self.__class__.__name__}({params})".format(
@@ -450,12 +453,19 @@ def _add_val_to_dict(key, value, tbl_dict, n_previous, missing_marker):
 
         assert 'file' not in h
 
+        if self.location:
+            # We have a location and can reconstruct the path using it
+            name_for_file_column = path.basename(file_name)
+        else:
+            # No location, so use whatever path the user passed in
+            name_for_file_column = file_name
+
         # Try opening header before this so that file name is only added if
         # file is valid FITS
         try:
-            summary['file'].append(path.basename(file_name))
+            summary['file'].append(name_for_file_column)
         except KeyError:
-            summary['file'] = [path.basename(file_name)]
+            summary['file'] = [name_for_file_column]
 
         missing_in_this_file = [k for k in summary if (k not in h and
                                                        k != 'file')]
diff --git a/ccdproc/tests/test_image_collection.py b/ccdproc/tests/test_image_collection.py
index ce31a559..d1554255 100644
--- a/ccdproc/tests/test_image_collection.py
+++ b/ccdproc/tests/test_image_collection.py
@@ -2,8 +2,9 @@
 
 import os
 from shutil import rmtree
-from tempfile import mkdtemp
+from tempfile import mkdtemp, TemporaryDirectory
 from glob import iglob
+from pathlib import Path
 import logging
 import pytest
 
@@ -809,3 +810,76 @@ def test_that_test_files_have_expected_properties(self, triage_setup):
 
         for column in expected.colnames:
             assert np.all(actual[column] == expected[column])
+
+    def test_image_collection_with_no_location(self, triage_setup):
+        # Test for a feature requested in
+        #
+        #     https://github.com/astropy/ccdproc/issues/374
+        #
+        # Create a collection from a list of file names (which can include
+        # path as needed)
+
+        source_path = Path(triage_setup.test_dir)
+
+        # Put the first three files in source_path into temp_path below
+        # then create the image collection out of the three in temp_path and the
+        # rest in source_path.
+        source_files = [p for p in source_path.iterdir()]
+
+        move_to_temp = source_files[:3]
+        keep_in_source = source_files[3:]
+
+        with TemporaryDirectory() as td:
+            temp_dir = Path(td)
+            file_paths = []
+            for source in move_to_temp:
+                temp_path = temp_dir / source.name
+                temp_path.write_bytes(source.read_bytes())
+                file_paths.append(str(temp_path))
+            file_paths.extend(str(p) for p in keep_in_source)
+
+            # Move up a level to make sure we are not accidentally
+            # pulling in files from the current working directory,
+            # which includes everythin in source.
+            os.chdir('..')
+
+            ic = ImageFileCollection(filenames=file_paths)
+            assert len(ic.summary) == len(file_paths)
+
+            expected_name = \
+                get_pkg_data_filename('data/expected_ifc_file_properties.csv')
+            expected = Table.read(expected_name)
+
+            # Make the comparison more reliable by sorting
+            expected.sort('file')
+
+            actual = ic.summary
+
+            # Write the actual IFC summary out to disk to turn bool into strings
+            # of"True" and "False", and any other non-essential differences
+            # between the tables.
+            tmp_file = 'actual.csv'
+            actual.write(tmp_file)
+            actual = Table.read(tmp_file)
+            # Make the comparison more reliable by sorting...but the actual
+            # in this case includes paths, so we really want to sort by the
+            # base name of the file.
+            bases = np.array([Path(f).name for f in actual['file']])
+            sort_order = np.argsort(bases)
+            actual = actual[sort_order]
+            bases = bases[sort_order]
+
+            assert all(Path(f).exists() for f in actual['file'])
+
+            for column in expected.colnames:
+                if column == 'file':
+                    assert np.all(bases == expected[column])
+                else:
+                    assert np.all(actual[column] == expected[column])
+
+            # Set comparisons don't care about order :)
+            # Check several of the ways we can get file names from the
+            # collection and ensure all of them include the path.
+            assert set(file_paths) == set(ic.summary['file'])
+            assert set(file_paths) == set(ic.files)
+            assert set(file_paths) == set(ic.files_filtered(include_path=True))

From 2ee289821ac748fcc2fb1f05a0ab19fe18df6653 Mon Sep 17 00:00:00 2001
From: Matthew Craig <mattwcraig@gmail.com>
Date: Fri, 26 Jul 2019 14:38:58 -0400
Subject: [PATCH 03/10] Add test for #662

Fixes #662 (though to be honest I was not able to reproduce it)
---
 ccdproc/tests/test_image_collection.py | 15 +++++++++++++--
 1 file changed, 13 insertions(+), 2 deletions(-)

diff --git a/ccdproc/tests/test_image_collection.py b/ccdproc/tests/test_image_collection.py
index d1554255..44b75ab1 100644
--- a/ccdproc/tests/test_image_collection.py
+++ b/ccdproc/tests/test_image_collection.py
@@ -816,14 +816,18 @@ def test_image_collection_with_no_location(self, triage_setup):
         #
         #     https://github.com/astropy/ccdproc/issues/374
         #
+        # and fix the bug reported in
+        #
+        #     https://github.com/astropy/ccdproc/issues/662
+        #
         # Create a collection from a list of file names (which can include
         # path as needed)
 
         source_path = Path(triage_setup.test_dir)
 
         # Put the first three files in source_path into temp_path below
-        # then create the image collection out of the three in temp_path and the
-        # rest in source_path.
+        # then create the image collection out of the three in temp_path and
+        # the rest in source_path.
         source_files = [p for p in source_path.iterdir()]
 
         move_to_temp = source_files[:3]
@@ -883,3 +887,10 @@ def test_image_collection_with_no_location(self, triage_setup):
             assert set(file_paths) == set(ic.summary['file'])
             assert set(file_paths) == set(ic.files)
             assert set(file_paths) == set(ic.files_filtered(include_path=True))
+
+            # Spot check a couple of dtypes as a test for
+            #   https://github.com/astropy/ccdproc/issues/662
+
+            assert ic.summary['extend'].dtype == 'bool'
+            assert ic.summary['naxis1'].dtype == 'int64'
+            assert ic.summary['exptime'].dtype == 'float64'

From 4cd7669b2828121806894b3068b2520bbdd7de0c Mon Sep 17 00:00:00 2001
From: Matthew Craig <mattwcraig@gmail.com>
Date: Fri, 26 Jul 2019 14:54:02 -0400
Subject: [PATCH 04/10] Revise documentation for ImageFileCollection

---
 ccdproc/image_collection.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/ccdproc/image_collection.py b/ccdproc/image_collection.py
index 9754b601..db670f2c 100644
--- a/ccdproc/image_collection.py
+++ b/ccdproc/image_collection.py
@@ -50,7 +50,8 @@ class ImageFileCollection(object):
 
     filenames: str, list of str, or None, optional
         List of the names of FITS files which will be added to the collection.
-        The filenames are assumed to be in ``location``.
+        The filenames may either be in ``location`` or the name can be a
+        relative or absolute path to the file.
         Default is ``None``.
 
     glob_include: str or None, optional

From 881ad4901791854019ea0d97108c4a251e185eef Mon Sep 17 00:00:00 2001
From: Matthew Craig <mattwcraig@gmail.com>
Date: Fri, 26 Jul 2019 15:25:25 -0400
Subject: [PATCH 05/10] Add option to initialize ImageFileCollection based on
 file contents

instead of just extensions. Fixes #620
---
 ccdproc/image_collection.py            | 28 ++++++++++---
 ccdproc/tests/test_image_collection.py | 57 ++++++++++++++++++++++++++
 docs/ccdproc/image_management.rst      | 13 ++++++
 3 files changed, 93 insertions(+), 5 deletions(-)

diff --git a/ccdproc/image_collection.py b/ccdproc/image_collection.py
index db670f2c..20663182 100644
--- a/ccdproc/image_collection.py
+++ b/ccdproc/image_collection.py
@@ -48,6 +48,12 @@ class ImageFileCollection(object):
         columns. Default value is '*' unless ``info_file`` is specified.
         Default is ``None``.
 
+    find_fits_by_reading: bool, optional
+        If ``True``, read each file in location to check whether the file is a
+        FITS file and include it in the collection based on that, rather than
+        by file name. Compressed files, e.g. image.fits.gz, will **NOT** be
+        properly detected. *Will be ignored if `filenames` is not ``None``.*
+
     filenames: str, list of str, or None, optional
         List of the names of FITS files which will be added to the collection.
         The filenames may either be in ``location`` or the name can be a
@@ -66,9 +72,9 @@ class ImageFileCollection(object):
         easily select subsets of files in the target directory.
         Default is ``None``.
 
-     ext: str or int, optional
-         The extension from which the header and data will be read in all files.
-         Default is ``0``.
+    ext: str or int, optional
+        The extension from which the header and data will be read in all
+        files.Default is ``0``.
 
     Raises
     ------
@@ -76,7 +82,9 @@ class ImageFileCollection(object):
         Raised if keywords are set to a combination of '*' and any other
         value.
     """
+
     def __init__(self, location=None, keywords=None,
+                 find_fits_by_reading=False,
                  filenames=None, glob_include=None, glob_exclude=None, ext=0):
         # Include or exclude files from the collection based on glob pattern
         # matching - has to go above call to _get_files()
@@ -93,6 +101,8 @@ def __init__(self, location=None, keywords=None,
         else:
             self._location = ''
 
+        self._find_fits_by_reading = find_fits_by_reading
+
         self._filenames = filenames
         self._files = []
         self._files = self._get_files()
@@ -708,8 +718,16 @@ def _fits_files_in_directory(self, extensions=None,
 
         all_files = listdir(self.location)
         files = []
-        for extension in full_extensions:
-            files.extend(fnmatch.filter(all_files, '*' + extension))
+        if not self._find_fits_by_reading:
+            for extension in full_extensions:
+                files.extend(fnmatch.filter(all_files, '*' + extension))
+        else:
+            for file in all_files:
+                with open(file, 'rb') as fp:
+                    # Hmm, first argument to is_fits is not actually used in
+                    # that function. *shrug*
+                    if fits.connect.is_fits('just some junk', file, fp):
+                        files.append(file)
 
         files.sort()
         return files
diff --git a/ccdproc/tests/test_image_collection.py b/ccdproc/tests/test_image_collection.py
index 44b75ab1..021e478f 100644
--- a/ccdproc/tests/test_image_collection.py
+++ b/ccdproc/tests/test_image_collection.py
@@ -894,3 +894,60 @@ def test_image_collection_with_no_location(self, triage_setup):
             assert ic.summary['extend'].dtype == 'bool'
             assert ic.summary['naxis1'].dtype == 'int64'
             assert ic.summary['exptime'].dtype == 'float64'
+
+            expected_heads = (actual['imagetyp'] == 'LIGHT').sum()
+
+            n_heads = 0
+            # Try one of the generators
+            for h in ic.headers(imagetyp='light'):
+                assert h['imagetyp'].lower() == 'light'
+                n_heads += 1
+
+            assert n_heads == expected_heads
+
+    def test_force_detect_fits_files_finds_fits_files(self, triage_setup):
+        # Tests for new feature
+        #
+        #     https://github.com/astropy/ccdproc/issues/620
+        #
+        # which supports adding all of the FITS files in a location based on
+        # their *contents* instead of their *extension*.
+
+        # Grab files from the default collection and make a copy with a new name
+        # (and with no fits-like extension)
+        #
+        # Making a copy of *every* file means we can just double the expected
+        # number of files as part of the tests.
+        path = Path(triage_setup.test_dir)
+        for idx, p in enumerate(path.iterdir()):
+            new_name = 'no_extension{}'.format(idx)
+            (path / new_name).write_bytes(p.read_bytes())
+
+        ic = ImageFileCollection(location=str(path),
+                                 find_fits_by_reading=True)
+
+        # Compressed files won't be automagically detected by reading the
+        # first few bytes.
+        expected_number = (2 * triage_setup.n_test['files'] -
+                           triage_setup.n_test['compressed'])
+
+        assert len(ic.summary) == expected_number
+
+        n_bias = (ic.summary['imagetyp'] == 'BIAS').sum()
+        assert n_bias == 2 * triage_setup.n_test['bias']
+
+        # Only one file in the original set of test files has exposure time
+        # 15, so there should be two now.
+        assert len(ic.files_filtered(exptime=15.0)) == 2
+
+        # Try one of the generators
+        expected_heads = (2 * triage_setup.n_test['light'] -
+                          triage_setup.n_test['compressed'])
+
+        n_heads = 0
+
+        for h in ic.headers(imagetyp='light'):
+            assert h['imagetyp'].lower() == 'light'
+            n_heads += 1
+
+        assert n_heads == expected_heads
diff --git a/docs/ccdproc/image_management.rst b/docs/ccdproc/image_management.rst
index 210e1f0a..83960116 100644
--- a/docs/ccdproc/image_management.rst
+++ b/docs/ccdproc/image_management.rst
@@ -31,6 +31,15 @@ collection to use all keywords in the headers::
 
     >>> ic_all = ImageFileCollection('.', keywords='*')
 
+Normally identification of FITS files is done by looking at the file extension
+and including all files with the correct extension.
+
+If the files are not compressed (e.g. not gzipped) then you can force the image
+collection to open each file and check from its contents whether it is FITS by
+using the ``find_fits_by_reading`` argument::
+
+    >> ic_from_content = ImageFileCollection('.', find_fits_by_reading=True)
+
 You can indicate filename patterns to include or exclude using Unix shell-style
 expressions. For example, to include all filenames that begin with ``1d_`` but
 not ones that include the word ``bad``, you could do::
@@ -38,6 +47,10 @@ not ones that include the word ``bad``, you could do::
     >>> ic_all = ImageFileCollection('.', glob_include='1d_*',
     ...                              glob_exclude='*bad*')
 
+Alternatively, you can create the collection with an explicit list of file names::
+
+    >>> ic_names = ImageFileCollection(filenames=['a.fits', 'b.fits.gz'])
+
 Most of the useful interaction with the image collection is via its
 ``.summary`` property, a :class:`~astropy.table.Table` of the value of each keyword for each
 file in the collection::

From f33d47d5845e38cf4526ba9376d70d81ca17ec89 Mon Sep 17 00:00:00 2001
From: Matthew Craig <mattwcraig@gmail.com>
Date: Fri, 26 Jul 2019 15:51:46 -0400
Subject: [PATCH 06/10] Add regression test for #607

Fixes #607 even though this code was not what did the fix. This does add
a check for the issue.
---
 ccdproc/tests/test_image_collection.py | 38 ++++++++++++++++++++++++++
 1 file changed, 38 insertions(+)

diff --git a/ccdproc/tests/test_image_collection.py b/ccdproc/tests/test_image_collection.py
index 021e478f..2f922cfb 100644
--- a/ccdproc/tests/test_image_collection.py
+++ b/ccdproc/tests/test_image_collection.py
@@ -951,3 +951,41 @@ def test_force_detect_fits_files_finds_fits_files(self, triage_setup):
             n_heads += 1
 
         assert n_heads == expected_heads
+
+    def test_less_strict_verify_option(self, triage_setup):
+        # Tests for feature request
+        #
+        #    https://github.com/astropy/ccdproc/issues/607
+        #
+        # which would allow reading of otherwise invalid FITS headers.
+
+        bad_header = """
+            NAXIS1  =                   10 / length of data axis 1
+            NAXIS2  =                   10 / length of data axis 2
+            TESTVERI= '2017/02/13-16:51:38 / Test VerifyWarning
+        """
+
+        testh = fits.Header.fromstring(bad_header)
+        print(testh)
+        testfits = fits.PrimaryHDU(data=np.ones((10, 10)), header=testh)
+
+        path = Path(triage_setup.test_dir)
+        bad_fits_name = 'test_warnA.fits'
+        testfits.writeto(path / bad_fits_name,
+                         output_verify='warn',
+                         overwrite=True)
+
+        ic = ImageFileCollection(location=str(path))
+        print(ic.summary.colnames)
+        assert bad_fits_name in ic.files
+
+        # Turns out this sample header is so messed up that TESTVERI does not
+        # end up as a keyword.
+        assert 'TESTVERI' not in ic.summary.colnames
+
+        # This does end up as a key some how *shrug*.
+        assert '17/02/13' in ic.summary.colnames
+
+        # Try making the summary as in the original bug report
+        ic = ImageFileCollection(location=str(path),
+                                 glob_include='*warnA*')

From 7b41fd6520f1d338ee150a5ff733d73b85d286b9 Mon Sep 17 00:00:00 2001
From: Matthew Craig <mattwcraig@gmail.com>
Date: Fri, 26 Jul 2019 16:04:26 -0400
Subject: [PATCH 07/10] Add test for #601

Fixes #601 even though this code only adds a test
---
 ccdproc/tests/test_image_collection.py | 24 ++++++++++++++++++++++++
 1 file changed, 24 insertions(+)

diff --git a/ccdproc/tests/test_image_collection.py b/ccdproc/tests/test_image_collection.py
index 2f922cfb..1738dc69 100644
--- a/ccdproc/tests/test_image_collection.py
+++ b/ccdproc/tests/test_image_collection.py
@@ -989,3 +989,27 @@ def test_less_strict_verify_option(self, triage_setup):
         # Try making the summary as in the original bug report
         ic = ImageFileCollection(location=str(path),
                                  glob_include='*warnA*')
+
+    def test_type_of_empty_collection(self, triage_setup):
+        # Test for implementation of the suggestion in
+        #
+        #    https://github.com/astropy/ccdproc/issues/601
+        #
+        # in which an empty collection with no keys has but with files
+        # returns a summary table with one column, but an empty collection
+        # with no keys and no files returns None.
+
+        # Make a dummy keyword that we then delete.
+        ic = ImageFileCollection(triage_setup.test_dir, keywords=['fafa'])
+        ic.keywords = []
+        assert set(ic.summary.colnames) == set(['file'])
+
+        # Remove all of the fits files
+        path = Path(triage_setup.test_dir)
+        for p in path.iterdir():
+            p.unlink()
+
+        # Now the summary should be none
+        ic = ImageFileCollection(triage_setup.test_dir)
+        assert ic.summary is None
+        assert ic.keywords == []

From 531454cc4f0701853fc366e56c10867951e8187a Mon Sep 17 00:00:00 2001
From: Matthew Craig <mattwcraig@gmail.com>
Date: Fri, 26 Jul 2019 19:22:50 -0400
Subject: [PATCH 08/10] Fix dtype tests on Windows

---
 ccdproc/tests/test_image_collection.py | 11 ++++++++---
 1 file changed, 8 insertions(+), 3 deletions(-)

diff --git a/ccdproc/tests/test_image_collection.py b/ccdproc/tests/test_image_collection.py
index 1738dc69..583807a8 100644
--- a/ccdproc/tests/test_image_collection.py
+++ b/ccdproc/tests/test_image_collection.py
@@ -890,10 +890,15 @@ def test_image_collection_with_no_location(self, triage_setup):
 
             # Spot check a couple of dtypes as a test for
             #   https://github.com/astropy/ccdproc/issues/662
-
             assert ic.summary['extend'].dtype == 'bool'
-            assert ic.summary['naxis1'].dtype == 'int64'
-            assert ic.summary['exptime'].dtype == 'float64'
+
+            # Of course, default dtypes on Windows are different. So instead
+            # of comparing to something sensible like int64, compare to the
+            # default int dtype.
+            assert ic.summary['naxis1'].dtype == np.array([5]).dtype
+
+            # and the default float dtype
+            assert ic.summary['exptime'].dtype == np.array([5.0]).dtype
 
             expected_heads = (actual['imagetyp'] == 'LIGHT').sum()
 

From b90078c64bfc2f28ae6620c8819337c7a26cf3b0 Mon Sep 17 00:00:00 2001
From: Matthew Craig <mattwcraig@gmail.com>
Date: Fri, 26 Jul 2019 19:41:18 -0400
Subject: [PATCH 09/10] Address review comments

---
 ccdproc/image_collection.py       | 8 ++++----
 docs/ccdproc/image_management.rst | 2 +-
 2 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/ccdproc/image_collection.py b/ccdproc/image_collection.py
index 20663182..26f817c4 100644
--- a/ccdproc/image_collection.py
+++ b/ccdproc/image_collection.py
@@ -722,12 +722,12 @@ def _fits_files_in_directory(self, extensions=None,
             for extension in full_extensions:
                 files.extend(fnmatch.filter(all_files, '*' + extension))
         else:
-            for file in all_files:
-                with open(file, 'rb') as fp:
+            for infile in all_files:
+                with open(infile, 'rb') as fp:
                     # Hmm, first argument to is_fits is not actually used in
                     # that function. *shrug*
-                    if fits.connect.is_fits('just some junk', file, fp):
-                        files.append(file)
+                    if fits.connect.is_fits('just some junk', infile, fp):
+                        files.append(infile)
 
         files.sort()
         return files
diff --git a/docs/ccdproc/image_management.rst b/docs/ccdproc/image_management.rst
index 83960116..f97e58c9 100644
--- a/docs/ccdproc/image_management.rst
+++ b/docs/ccdproc/image_management.rst
@@ -49,7 +49,7 @@ not ones that include the word ``bad``, you could do::
 
 Alternatively, you can create the collection with an explicit list of file names::
 
-    >>> ic_names = ImageFileCollection(filenames=['a.fits', 'b.fits.gz'])
+    >>> ic_names = ImageFileCollection(filenames=['a.fits', '/some/path/b.fits.gz'])
 
 Most of the useful interaction with the image collection is via its
 ``.summary`` property, a :class:`~astropy.table.Table` of the value of each keyword for each

From 4fe96b1d629d1f1df804a424483255a854178220 Mon Sep 17 00:00:00 2001
From: Matthew Craig <mattwcraig@gmail.com>
Date: Fri, 26 Jul 2019 19:52:08 -0400
Subject: [PATCH 10/10] Add change log entry

---
 CHANGES.rst | 16 ++++++++++++++++
 1 file changed, 16 insertions(+)

diff --git a/CHANGES.rst b/CHANGES.rst
index 864425a2..3d6a9943 100644
--- a/CHANGES.rst
+++ b/CHANGES.rst
@@ -4,6 +4,12 @@
 New Features
 ^^^^^^^^^^^^
 
+- Allow initialization of ``ImageFileCollection`` from a list of files with no
+  location set. [#374, #661, #680]
+
+- Allow identification of FITS files in ``ImageFileCollection`` based on content
+  of the files instead of file name extension. [#620, #680]
+
 Other Changes and Additions
 ^^^^^^^^^^^^^^^^^^^^^^^^^^^
 
@@ -19,8 +25,15 @@ Other Changes and Additions
 
 - Added support for .bz2, .Z and .zip file formats in ``ImageFileCollection``.
 
+- Removed support for initializing ``ImageFileCollection`` from a table instead
+  of files. [#680]
+
+- More consistent typing of ``ImageFileCollection.summary`` when the collection
+  is empty. [#601, #680]
+
 Bug Fixes
 ^^^^^^^^^
+
 - Function ``median_combine`` now correctly calculates the uncertainty for
   masked ``CCDData``. [#608]
 
@@ -29,6 +42,9 @@ Bug Fixes
 - Raise ``ValueError`` error in ``subtract_dark`` for when the errors have
   different shapes [#674, #677]
 
+- Fix problem with column dtypes when initializing ``ImageFileCollection`` from
+  a list of file names. [#662, #680]
+
 1.3.0 (2017-11-1)
 -----------------